# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_23	LOCUS_00220	sequence001:30638..31099(-)	partial			WP_004114571.1	30S ribosomal protein S16	69.3	69.3	97.2
MGA_41	LOCUS_00400	sequence001:49705..50025(+)	partial			WP_004574855.1	hypothetical protein	100.0	73.6	100.0
MGA_63	LOCUS_00620	sequence001:81032..81319(+)	frameshift		81313	WP_004117424.1	histidine phosphatase family protein	100.0	42.4	100.0
MGA_64	LOCUS_00630	sequence001:81294..81707(+)	frameshift		81313	WP_004117424.1	histidine phosphatase family protein	94.9	58.0	100.0
MGA_86	LOCUS_00830	sequence002:16975..17454(+)	frameshift		17406,17422	WP_013399502.1	GTPase HflX	80.5	26.2	96.1
MGA_87	LOCUS_00840	sequence002:17487..18494(+)	frameshift		17406,17422	WP_013399502.1	GTPase HflX	100.0	68.5	99.1
MGA_94	LOCUS_00910	sequence002:23634..25250(-)	frameshift		25296	WP_020760760.1	DUF4037 domain-containing protein	100.0	78.5	99.3
MGA_95	LOCUS_00920	sequence002:25282..25692(-)	frameshift		25296	WP_020760760.1	DUF4037 domain-containing protein	97.8	19.4	99.2
MGA_137	LOCUS_01330	sequence003:27039..28091(+)	frameshift		28040,28072,28088,28062	WP_013399520.1	glutamine-hydrolyzing GMP synthase	100.0	67.1	96.6
MGA_138	LOCUS_01340	sequence003:28159..28605(+)	frameshift		28072,28065,28043,28088	WP_013399520.1	glutamine-hydrolyzing GMP synthase	100.0	28.5	99.3
MGA_154	LOCUS_01490	sequence004:1..1502(+)	partial			WP_004111766.1	carbamoyl-phosphate synthase large subunit	100.0	44.1	99.2
MGA_167	LOCUS_01620	sequence004:14063..14296(+)	partial			WP_091232349.1	restriction endonuclease subunit S	75.3	18.9	48.3
MGA_170	LOCUS_01650	sequence004:15503..16168(+)	partial			WP_108806778.1	recombinase family protein	100.0	42.1	95.5
MGA_187	LOCUS_01820	sequence004:30541..30702(+)	partial			WP_201275746.1	transposon-encoded TnpW family protein	75.5	48.8	78.0
MGA_199	LOCUS_01940	sequence004:40638..41225(+)	partial			WP_116438320.1	YcxB family protein	100.0	45.0	89.2
MGA_221	LOCUS_02140	sequence005:12435..12968(+)	partial			WP_009994709.1	DUF6350 family protein	100.0	33.3	97.2
MGA_223	LOCUS_02160	sequence005:14789..15037(+)	partial			WP_004113661.1	DUF3017 domain-containing protein	98.8	62.8	100.0
MGA_224	LOCUS_02170	sequence005:15157..15309(+)	partial			WP_004113665.1	pseudouridine synthase	100.0	19.5	98.0
MGA_240	LOCUS_02330	sequence005:40739..41005(+)	frameshift		40993,41085,41045	WP_004111603.1	histidine--tRNA ligase	97.7	18.5	96.5
MGA_241	LOCUS_02340	sequence005:41156..42148(+)	frameshift		41048,40993,41085	WP_004111603.1	histidine--tRNA ligase	100.0	70.8	98.8
MGA_274	LOCUS_02650	sequence006:39270..39983(+)	partial			WP_013399469.1	glycosyltransferase	96.2	60.8	98.2
MGA_292	LOCUS_02820	sequence007:17716..17946(-)	frameshift,internal_stop_codon	17962..17964(-)	18046	WP_016475763.1	BRO family protein	77.6	21.1	76.3
MGA_304	LOCUS_02940	sequence007:34379..34825(+)	frameshift		34810	WP_004114280.1	glucose-6-phosphate dehydrogenase assembly protein OpcA	97.3	45.4	97.9
MGA_305	LOCUS_02950	sequence007:34815..35333(+)	frameshift		34810	WP_004114280.1	glucose-6-phosphate dehydrogenase assembly protein OpcA	100.0	54.3	100.0
MGA_307	LOCUS_02970	sequence007:36435..37043(-)	frameshift		37035	WP_013399773.1	NADP-dependent phosphogluconate dehydrogenase	99.0	41.2	99.5
MGA_309	LOCUS_02980	sequence008:1360..4899(+)	internal_stop_codon	4897..4899(+)		WP_013399490.1	S8 family serine peptidase	100.0	58.8	98.4
MGA_310	LOCUS_02990	sequence008:5014..7374(+)	internal_stop_codon	4897..4899(+)		WP_013399490.1	S8 family serine peptidase	100.0	39.2	91.9
MGA_347	LOCUS_03340	sequence010:15114..15707(-)	frameshift		15724	WP_013399334.1	ABC transporter permease	100.0	21.3	93.4
MGA_348	LOCUS_03350	sequence010:15704..17890(-)	frameshift		15724	WP_013399334.1	ABC transporter permease	96.8	76.3	97.7
MGA_371	LOCUS_03580	sequence011:5953..6798(-)	frameshift		6908,6886	WP_013399489.1	phospho-N-acetylmuramoyl-pentapeptide-transferase	100.0	76.6	97.2
MGA_372	LOCUS_03590	sequence011:6870..7058(-)	frameshift		6908,6886	WP_013399489.1	phospho-N-acetylmuramoyl-pentapeptide-transferase	85.5	14.4	92.5
MGA_393	LOCUS_03800	sequence011:30878..31264(+)	partial			WP_004112250.1	sugar ABC transporter permease	100.0	40.8	100.0
MGA_397	LOCUS_03840	sequence012:1..738(+)	partial			WP_013399363.1	DNA gyrase subunit A	100.0	27.9	99.6
MGA_410	LOCUS_03970	sequence013:1..614(+)	partial			WP_013399360.1	murein biosynthesis integral membrane protein MurJ	100.0	34.1	92.6
MGA_425	LOCUS_04120	sequence013:17972..19714(+)	partial			WP_013399363.1	DNA gyrase subunit A	98.6	65.1	100.0
MGA_453	LOCUS_04380	sequence015:5774..6907(-)	frameshift		6908,6975	WP_004116039.1	preprotein translocase subunit SecY	100.0	84.5	97.3
MGA_475	LOCUS_04600	sequence015:17256..18002(-)	internal_stop_codon	18093..18095(-)		WP_180947085.1	bifunctional acetaldehyde-CoA/alcohol dehydrogenase	100.0	27.5	98.4
MGA_476	LOCUS_04610	sequence015:18093..19961(-)	internal_stop_codon	18093..18095(-)		WP_180947085.1	bifunctional acetaldehyde-CoA/alcohol dehydrogenase	100.0	69.0	97.4
MGA_540	LOCUS_05160	sequence020:7014..>7787(-)	partial			WP_013399406.1	extracellular solute-binding protein	100.0	62.8	100.0
MGA_549	LOCUS_05250	sequence021:10215..10529(-)	frameshift		10570,10548,10583	WP_013399401.1	nitroreductase family protein	100.0	38.4	99.0
MGA_550	LOCUS_05260	sequence021:10557..11033(-)	frameshift		10570,10548,10583	WP_013399401.1	nitroreductase family protein	94.9	55.4	95.3
MGA_554	LOCUS_05300	sequence021:14383..14892(-)	frameshift		14905	WP_013399403.1	LacI family DNA-binding transcriptional regulator	100.0	49.9	96.4
MGA_555	LOCUS_05310	sequence021:14861..15403(-)	frameshift		14902	WP_013399403.1	LacI family DNA-binding transcriptional regulator	92.8	49.3	98.2
MGA_574	LOCUS_05480	sequence022:15345..15881(-)	partial			WP_009994383.1	phosphoribosyltransferase family protein	100.0	68.2	98.3
MGA_602	LOCUS_05730	sequence024:4820..5539(-)	frameshift		5771	WP_032840997.1	hypothetical protein	97.9	42.5	79.5
MGA_603	LOCUS_05740	sequence024:5769..6473(-)	frameshift		5804	WP_032840997.1	hypothetical protein	94.9	40.4	98.6
MGA_614	LOCUS_05850	sequence024:21784..22617(-)	partial			WP_004112200.1	anaerobic ribonucleoside-triphosphate reductase	100.0	33.9	99.6
MGA_615	LOCUS_05860	sequence025:1..635(+)	partial			WP_004120484.1	F0F1 ATP synthase subunit beta	100.0	42.4	100.0
MGA_635	LOCUS_06060	sequence026:40..1422(+)	partial			WP_009994308.1	hypothetical protein	8.9	16.9	70.7
MGA_649	LOCUS_06190	sequence027:3141..4187(-)	frameshift		4191,4301,4246,4359	WP_013399612.1	DNA translocase FtsK	100.0	37.9	99.7
MGA_650	LOCUS_06200	sequence027:4339..5898(-)	frameshift		4304,4249,4191,4359	WP_013399612.1	DNA translocase FtsK	99.0	56.1	90.9
MGA_659	LOCUS_06290	sequence027:19193..20197(+)	partial			WP_013399614.1	alpha/beta hydrolase-fold protein	100.0	72.9	100.0
MGA_663	LOCUS_06330	sequence027:23491..>24281(-)	partial			WP_004113596.1	5-(carboxyamino)imidazole ribonucleotide synthase	100.0	67.2	99.6
MGA_694	LOCUS_06600	sequence030:18276..>19438(-)	partial			WP_004114108.1	RNA degradosome polyphosphate kinase	100.0	51.8	97.4
MGA_695	LOCUS_06610	sequence031:89..382(+)	frameshift		75	WP_014554396.1	PTS sugar transporter subunit IIC	100.0	22.1	100.0
MGA_707	LOCUS_06720	sequence032:6017..7453(-)	partial			WP_009994308.1	hypothetical protein	11.7	21.4	60.7
MGA_732	LOCUS_06940	sequence034:416..1420(-)	internal_stop_codon	1505..1507(-)		WP_101886502.1	1,4-beta-N-acetylmuramidase	100.0	82.9	96.1
MGA_808	LOCUS_07570	sequence042:5022..5498(+)	frameshift		5393	WP_013399574.1	ComEC/Rec2 family competence protein	78.5	20.4	100.0
MGA_809	LOCUS_07580	sequence042:5489..6847(+)	frameshift		5423	WP_013399574.1	ComEC/Rec2 family competence protein	100.0	74.5	99.6
MGA_821	LOCUS_07700	sequence043:13698..14192(-)	internal_stop_codon	14214..14216(-)		WP_013399572.1	fructosamine kinase family protein	100.0	61.2	100.0
MGA_823	LOCUS_07720	sequence044:1179..1637(+)	partial			WP_009994082.1	MFS transporter	100.0	36.2	100.0
MGA_829	LOCUS_07780	sequence044:6651..7343(+)	partial			WP_004113739.1	hypothetical protein	100.0	59.6	97.8
MGA_835	LOCUS_07840	sequence045:1..766(+)	partial			WP_108806778.1	recombinase family protein	100.0	48.4	95.3
MGA_851	LOCUS_08000	sequence045:17019..>17552(-)	partial			WP_013399592.1	beta-carotene 15,15'-monooxygenase	100.0	24.0	98.9
MGA_893	LOCUS_08360	sequence049:11262..11993(+)	frameshift		11984	WP_013399551.1	DUF2075 domain-containing protein	99.2	33.2	99.6
MGA_894	LOCUS_08370	sequence049:11962..13443(+)	frameshift		11984	WP_013399551.1	DUF2075 domain-containing protein	99.0	67.2	96.9
MGA_898	LOCUS_08400	sequence050:1790..2194(+)	partial			WP_004138162.1	ABC transporter permease	100.0	50.6	100.0
MGA_912	LOCUS_08540	sequence051:7498..7644(-)	partial			WP_013399473.1	hypothetical protein	100.0	46.6	91.7
MGA_932	LOCUS_08700	sequence053:291..968(-)	partial			WP_009993974.1	type II CAAX endopeptidase family protein	100.0	68.2	100.0
MGA_951	LOCUS_08890	sequence054:12546..14030(+)	frameshift		14018,14068,14061	WP_013399592.1	beta-carotene 15,15'-monooxygenase	99.4	66.4	97.4
MGA_964	LOCUS_09020	sequence056:130..831(-)	frameshift		171,12	WP_162861121.1	hypothetical protein	94.4	72.6	99.5
MGA_965	LOCUS_09030	sequence056:1159..1968(-)	partial			WP_009993952.1	MFS transporter	100.0	62.6	97.8
MGA_972	LOCUS_09100	sequence057:1..736(+)	partial			WP_180947083.1	cell wall-binding protein	100.0	9.1	99.6
MGA_978	LOCUS_09160	sequence058:2619..3833(-)	partial			WP_009994308.1	hypothetical protein	45.3	74.1	34.0
MGA_981	LOCUS_09190	sequence058:6780..7745(+)	partial			WP_101886334.1	DUF6020 family protein	100.0	45.1	95.0
MGA_987	LOCUS_09250	sequence058:12006..13097(-)	frameshift		13104,13126	WP_004118365.1	NCS2 family permease	100.0	78.2	94.5
MGA_988	LOCUS_09260	sequence059:1..5616(+)	partial			WP_013399748.1	Rib/alpha-like domain-containing protein	100.0	61.1	94.7
MGA_1020	LOCUS_09540	sequence063:6853..7536(+)	internal_stop_codon	7534..7536(+)		WP_004111779.1	methylenetetrahydrofolate reductase [NAD(P)H]	100.0	79.9	100.0
MGA_1025	LOCUS_09580	sequence064:1..780(+)	partial			WP_004114086.1	sugar ABC transporter substrate-binding protein	100.0	59.0	100.0
MGA_1026	LOCUS_09590	sequence064:1414..1821(+)	partial			WP_013399353.1	sugar ABC transporter permease	100.0	43.5	91.9
MGA_1035	LOCUS_09660	sequence065:5231..6598(-)	partial			WP_009994308.1	hypothetical protein	8.4	15.6	71.1
MGA_1057	LOCUS_09840	sequence069:6472..>7835(-)	partial			WP_013399425.1	ABC transporter ATP-binding protein	100.0	71.8	97.8
MGA_1060	LOCUS_09870	sequence070:8745..11234(-)	internal_stop_codon	8745..8747(-)		WP_101886584.1	GA module-containing protein	90.1	40.3	66.3
MGA_1068	LOCUS_09950	sequence071:7774..>8327(-)	partial			WP_013399385.1	GntR family transcriptional regulator	100.0	69.1	100.0
MGA_1069	LOCUS_09960	sequence072:1..711(+)	partial			WP_004114399.1	sugar ABC transporter permease	100.0	73.5	97.5
MGA_1078	LOCUS_10040	sequence073:1..613(+)	partial			WP_004122184.1	M20 family metallopeptidase	100.0	49.6	100.0
MGA_1085	LOCUS_10110	sequence073:7528..8013(-)	frameshift		8089	WP_013399497.1	class C sortase	100.0	42.0	96.9
MGA_1089	LOCUS_10130	sequence074:1851..2132(-)	partial			WP_009993795.1	rhomboid family intramembrane serine protease	82.8	33.0	94.8
MGA_1110	LOCUS_10320	sequence076:8147..>8928(-)	partial			WP_004115494.1	preprotein translocase subunit SecA	100.0	28.1	98.8
MGA_1112	LOCUS_10340	sequence077:1519..1662(+)	partial			WP_004113042.1	hypothetical protein	59.6	59.6	100.0
MGA_1118	LOCUS_10400	sequence077:10839..11804(+)	partial			WP_013399731.1	folylpolyglutamate synthase/dihydrofolate synthase family protein	99.7	66.1	96.6
MGA_1125	LOCUS_10470	sequence078:10417..>10930(-)	partial			WP_013399621.1	ABC transporter ATP-binding protein	100.0	59.9	100.0
MGA_1132	LOCUS_10530	sequence079:6398..6745(-)	frameshift		6785	WP_004111773.1	dihydroorotate dehydrogenase	100.0	34.7	93.0
MGA_1133	LOCUS_10540	sequence079:6768..7394(-)	frameshift		6785	WP_004111773.1	dihydroorotate dehydrogenase	99.0	62.2	98.1
MGA_1136	LOCUS_10570	sequence080:2019..2219(+)	frameshift		2189	WP_013399530.1	InlB B-repeat-containing protein	87.9	8.0	91.4
MGA_1138	LOCUS_10590	sequence080:2594..4195(+)	partial			WP_013399530.1	InlB B-repeat-containing protein	100.0	73.5	91.9
MGA_1144	LOCUS_10650	sequence080:8517..8735(-)	partial			WP_004112566.1	hypothetical protein	100.0	53.3	98.6
MGA_1159	LOCUS_10770	sequence083:1..1664(+)	partial			WP_013399429.1	KUP/HAK/KT family potassium transporter	100.0	66.4	96.9
MGA_1166	LOCUS_10830	sequence084:1557..2222(-)	frameshift		1646	WP_013399495.1	hypothetical protein	86.9	79.0	100.0
MGA_1167	LOCUS_10840	sequence084:2259..7028(-)	internal_stop_codon	2259..2261(-)		WP_162862660.1	Rib/alpha-like domain-containing protein	99.0	83.6	43.7
MGA_1170	LOCUS_10870	sequence085:5613..5792(-)	frameshift		5636	WP_013399534.1	InlB B-repeat-containing protein	91.5	6.1	100.0
MGA_1188	LOCUS_11020	sequence087:8690..>9194(-)	partial			WP_004113201.1	2-keto-3-deoxygluconate permease	100.0	52.2	80.8
MGA_1189	LOCUS_11030	sequence088:1..1321(+)	partial			WP_013399537.1	bifunctional (p)ppGpp synthetase/guanosine-3',5'-bis(diphosphate) 3'-pyrophosphohydrolase	100.0	56.4	98.9
MGA_1191	LOCUS_11050	sequence088:2112..>3108(-)	partial			WP_013399538.1	phosphomethylpyrimidine synthase ThiC	100.0	37.6	100.0
MGA_1192	LOCUS_11060	sequence089:1..825(+)	partial			WP_161796623.1	alkaline phosphatase family protein	100.0	69.0	100.0
MGA_1199	LOCUS_11110	sequence090:2702..3370(+)	internal_stop_codon	3368..3370(+)		WP_004112605.1	formate C-acetyltransferase	100.0	28.1	98.6
MGA_1220	LOCUS_11250	sequence094:5072..>6435(-)	partial			WP_004575067.1	ATP-dependent zinc metalloprotease FtsH	100.0	60.3	97.8
MGA_1226	LOCUS_11300	sequence095:4135..>5403(-)	partial			WP_162861487.1	ATP-dependent chaperone ClpB	100.0	48.8	98.3
MGA_1228	LOCUS_11310	sequence096:851..>1778(-)	partial			WP_013399764.1	FAD-binding protein	100.0	72.1	100.0
MGA_1232	LOCUS_11340	sequence097:2698..>3613(-)	partial			WP_004573712.1	amino acid permease	100.0	56.7	93.1
MGA_1253	LOCUS_11510	sequence103:3992..>4823(-)	partial			WP_004112605.1	formate C-acetyltransferase	100.0	34.9	100.0
MGA_1255	LOCUS_11530	sequence104:2336..>4642(-)	partial			WP_013399740.1	DNA-directed RNA polymerase subunit beta'	97.7	56.0	100.0
MGA_1256	LOCUS_11540	sequence105:511..633(+)	partial			WP_014554495.1	nucleoside hydrolase	100.0	12.9	97.5
MGA_1266	LOCUS_11610	sequence107:4591..>5192(-)	partial			WP_013399756.1	substrate-binding domain-containing protein	100.0	57.7	98.0
MGA_1278	LOCUS_11720	sequence110:3365..3664(+)	partial			WP_004122184.1	M20 family metallopeptidase	88.9	21.5	100.0
MGA_1287	LOCUS_11780	sequence112:4584..4913(-)	partial			WP_004111656.1	UMP kinase	100.0	43.8	100.0
MGA_1290	LOCUS_11800	sequence113:1525..>2130(-)	partial			WP_013399323.1	F0F1 ATP synthase subunit alpha	100.0	36.3	100.0
MGA_1293	LOCUS_11820	sequence114:3327..3506(-)	partial			WP_116440418.1	type I-E CRISPR-associated endonuclease Cas1e	100.0	18.8	93.2
MGA_1294	LOCUS_11830	sequence115:1..658(+)	partial			WP_004118143.1	LacI family DNA-binding transcriptional regulator	100.0	64.5	97.7
MGA_1296	LOCUS_11850	sequence115:1729..>2757(-)	partial			WP_013399407.1	alpha-amylase family glycosyl hydrolase	99.7	60.0	100.0
MGA_1308	LOCUS_11940	sequence119:1..1129(+)	partial			WP_013399446.1	translation initiation factor IF-2	100.0	38.4	100.0
MGA_1310	LOCUS_11960	sequence119:1750..2760(+)	frameshift		2817,2887,2776,2795,2751	WP_013399447.1	tRNA pseudouridine(55) synthase TruB	99.4	83.5	93.4
MGA_1311	LOCUS_11970	sequence120:1..704(+)	partial			WP_013399648.1	bifunctional UDP-N-acetylglucosamine diphosphorylase/glucosamine-1-phosphate N-acetyltransferase GlmU	100.0	49.5	97.4
MGA_1323	LOCUS_12040	sequence124:1..534(+)	partial			WP_004137617.1	DNA recombination protein RmuC	100.0	39.7	100.0
MGA_1324	LOCUS_12050	sequence124:592..1125(+)	frameshift		1086	WP_004573630.1	hypothetical protein	93.2	58.5	100.0
MGA_1325	LOCUS_12060	sequence124:1139..1441(+)	frameshift		1086	WP_004573630.1	hypothetical protein	100.0	35.5	94.0
MGA_1332	LOCUS_12090	sequence127:809..1321(+)	partial			WP_013399773.1	NADP-dependent phosphogluconate dehydrogenase	100.0	35.0	94.7
MGA_1337	LOCUS_12110	sequence130:440..>1127(-)	partial			WP_004113351.1	CTP synthase	97.4	40.0	99.1
MGA_1340	LOCUS_12120	sequence132:1..662(+)	partial			WP_048730823.1	FGGY family carbohydrate kinase	100.0	44.3	100.0
MGA_1341	LOCUS_12130	sequence132:751..918(+)	frameshift		962,903,1001,988,972,943	WP_013399756.1	substrate-binding domain-containing protein	92.7	14.8	100.0
MGA_1344	LOCUS_12140	sequence133:1007..1180(+)	partial			WP_004114066.1	sn-glycerol-3-phosphate ABC transporter ATP-binding protein UgpC	77.2	11.7	100.0
MGA_1350	LOCUS_12160	sequence138:1..833(+)	frameshift		904,827,894	WP_180947083.1	cell wall-binding protein	100.0	10.3	94.2
MGA_1360	LOCUS_12200	sequence144:64..>799(-)	partial			WP_013399688.1	ATP-binding protein	100.0	60.7	100.0
MGA_1361	LOCUS_12210	sequence145:1..748(+)	partial			WP_004118145.1	extracellular solute-binding protein	100.0	65.2	82.4
