# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_7	LOCUS_00060	sequence001:4855..5055(-)	internal_stop_codon	5149..5151(-)		WP_000214765.1	AAA family ATPase	90.9	6.5	46.7
MGA_14	LOCUS_00130	sequence001:9922..10359(-)	partial			WP_002917164.1	type III-A CRISPR-associated protein Csm2	89.0	68.2	40.5
MGA_34	LOCUS_00320	sequence001:33437..33793(-)	internal_stop_codon	33917..33919(-)		WP_010922509.1	type I-C CRISPR-associated endonuclease Cas1c	97.5	33.7	59.1
MGA_35	LOCUS_00330	sequence001:33917..34459(-)	internal_stop_codon	33917..33919(-)		WP_010932802.1	type I-C CRISPR-associated endonuclease Cas1c	98.3	51.6	42.4
MGA_43	LOCUS_00410	sequence001:42817..43158(-)	frameshift		43392,43126,43151	WP_003813444.1	nitroreductase family protein	78.8	42.4	33.7
MGA_47	LOCUS_00450	sequence001:44809..44982(-)	partial			WP_011987099.1	methyl-accepting chemotaxis protein	89.5	8.9	58.8
MGA_68	LOCUS_00660	sequence001:72619..72906(-)	partial			WP_002303793.1	lipopolysaccharide assembly protein LapA domain-containing protein	87.4	56.5	36.1
MGA_104	LOCUS_01020	sequence001:104284..106425(-)	partial			WP_011101414.1	DNA translocase FtsK	72.1	51.2	63.8
MGA_128	LOCUS_01260	sequence001:128107..128433(-)	frameshift		128412,128583	WP_011100915.1	peptide ABC transporter substrate-binding protein	94.4	18.4	55.9
MGA_129	LOCUS_01270	sequence001:128384..128578(-)	frameshift		128416	WP_011254634.1	peptide ABC transporter substrate-binding protein	89.1	10.5	54.4
MGA_146	LOCUS_01440	sequence002:212..346(-)	partial			WP_011476585.1	RNA-guided endonuclease TnpB family protein	97.7	10.1	74.4
MGA_199	LOCUS_01970	sequence002:52665..53015(-)	partial			WP_010496068.1	hypothetical protein	75.9	74.6	38.6
MGA_218	LOCUS_02160	sequence002:71174..71359(+)	partial			WP_003694124.1	30S ribosomal protein S21	70.5	70.5	100.0
MGA_325	LOCUS_03230	sequence004:23745..23984(-)	partial			WP_003641297.1	hypothetical protein	94.9	70.9	35.5
MGA_356	LOCUS_03540	sequence005:43..1857(-)	partial			WP_010964394.1	hypothetical protein	75.3	13.8	28.5
MGA_366	LOCUS_03640	sequence005:13037..14194(-)	partial			WP_053240438.1	glycosyltransferase family 1 protein	47.5	43.8	27.5
MGA_396	LOCUS_03940	sequence005:44728..46251(-)	partial			WP_002286053.1	SpaH/EbpB family LPXTG-anchored major pilin	67.9	55.4	30.4
MGA_452	LOCUS_04500	sequence006:35524..36489(+)	partial			WP_010965544.1	alpha/beta hydrolase	82.9	73.8	34.3
MGA_456	LOCUS_04540	sequence006:40399..41151(+)	internal_stop_codon	41149..41151(+)		WP_012972561.1	IS110 family transposase	98.4	61.8	46.8
MGA_457	LOCUS_04550	sequence006:41170..41622(+)	internal_stop_codon	41149..41151(+)		WP_003549893.1	IS110 family transposase	98.0	35.8	59.9
MGA_458	LOCUS_04560	sequence006:41880..42941(+)	frameshift		43064,42869	WP_115276001.1	ISL3 family transposase	94.1	77.8	34.9
MGA_464	LOCUS_04620	sequence006:49768..51948(+)	partial			WP_003434402.1	ATP-dependent RecD-like DNA helicase	47.0	50.2	24.7
MGA_486	LOCUS_04830	sequence007:21716..22426(-)	internal_stop_codon	22430..22432(-)		WP_041272513.1	flagellin	96.2	70.4	32.7
MGA_487	LOCUS_04840	sequence007:22430..22774(-)	internal_stop_codon	22430..22432(-)		WP_011392281.1	flagellin	99.1	29.7	61.9
MGA_493	LOCUS_04900	sequence007:29137..29610(-)	partial			WP_003700642.1	ComF family protein	100.0	68.4	45.9
MGA_496	LOCUS_04930	sequence007:31980..32228(-)	frameshift,internal_stop_codon	32016..32018(-)	32024	WP_003703269.1	IS200/IS605 family transposase	82.9	47.6	63.2
MGA_542	LOCUS_05390	sequence008:33901..34320(+)	partial			WP_011476136.1	cell division protein SepF	75.5	74.7	47.3
MGA_549	LOCUS_05460	sequence008:41725..41892(+)	partial			WP_011475897.1	RNA-guided endonuclease TnpB family protein	78.2	10.1	67.4
MGA_563	LOCUS_05600	sequence009:5203..5490(-)	partial			WP_003098742.1	flagellar biosynthesis anti-sigma factor FlgM	78.9	70.1	33.3
MGA_574	LOCUS_05710	sequence009:14323..15594(-)	partial			WP_011462131.1	methyl-accepting chemotaxis protein	93.1	59.4	29.9
MGA_580	LOCUS_05770	sequence009:21008..22075(-)	internal_stop_codon	22097..22099(-)		WP_011986950.1	fused FliR family export protein/FlhB family type III secretion system protein	96.9	56.5	39.7
MGA_581	LOCUS_05780	sequence009:22097..22855(-)	internal_stop_codon	22097..22099(-)		WP_010965447.1	fused FliR family export protein/FlhB family type III secretion system protein	99.6	41.5	27.8
MGA_586	LOCUS_05830	sequence009:24945..25202(-)	partial			WP_005816224.1	flagellar FlbD family protein	65.9	74.7	48.2
MGA_588	LOCUS_05850	sequence009:26217..26570(-)	partial			WP_011986955.1	TIGR02530 family flagellar biosynthesis protein	82.1	71.2	44.4
MGA_596	LOCUS_05930	sequence009:32233..33633(-)	internal_stop_codon	32233..32235(-)		WP_010965461.1	flagellar basal-body MS-ring/collar protein FliF	94.4	84.9	34.0
MGA_597	LOCUS_05940	sequence009:33658..33972(-)	partial			WP_011986961.1	flagellar hook-basal body complex protein FliE	71.2	71.2	41.9
MGA_615	LOCUS_06120	sequence010:13399..13743(+)	partial			WP_003700554.1	preprotein translocase subunit YajC	75.4	68.3	55.8
MGA_638	LOCUS_06350	sequence010:34763..35014(+)	partial			WP_002295087.1	cell division protein ZapA	95.2	54.5	48.1
MGA_654	LOCUS_06510	sequence011:6238..7185(+)	partial			WP_004398990.1	inositol 2-dehydrogenase	75.2	73.0	24.2
MGA_694	LOCUS_06910	sequence012:10195..10443(-)	partial			WP_002287688.1	tyrosine-type recombinase/integrase	95.1	20.8	58.2
MGA_695	LOCUS_06920	sequence012:10896..11240(-)	internal_stop_codon	11292..11294(-)		WP_003703269.1	IS200/IS605 family transposase	89.5	71.3	72.5
MGA_702	LOCUS_06990	sequence012:20832..21773(+)	partial			WP_002369211.1	glycerophosphodiester phosphodiesterase	73.5	38.2	40.9
MGA_716	LOCUS_07130	sequence013:634..2922(+)	frameshift,internal_stop_codon	511..513(+)	519	WP_000200226.1	YfhO family protein	48.6	40.7	24.5
MGA_718	LOCUS_07150	sequence013:4031..4876(-)	partial			WP_225355332.1	6-pyruvoyl-tetrahydropterin synthase-related protein	95.4	45.2	24.9
MGA_723	LOCUS_07200	sequence013:11075..12187(-)	partial			WP_081581110.1	N-acetylmuramoyl-L-alanine amidase	55.4	19.4	58.7
MGA_743	LOCUS_07400	sequence013:33920..34279(+)	partial			WP_011476362.1	CrcB family protein	68.1	62.8	53.1
MGA_767	LOCUS_07640	sequence014:22029..22244(+)	partial			WP_011254133.1	RNA-guided endonuclease TnpB family protein	93.0	17.1	66.7
MGA_792	LOCUS_07890	sequence015:14251..15231(+)	partial			WP_010870531.1	phosphoglycerate dehydrogenase	82.2	50.6	33.3
MGA_801	LOCUS_07980	sequence015:23897..24445(-)	partial			WP_010868022.1	SagB/ThcOx family dehydrogenase	70.9	65.8	38.6
MGA_803	LOCUS_08000	sequence015:25569..25700(-)	frameshift		25708	WP_011254325.1	transporter substrate-binding domain-containing protein	95.3	14.3	65.9
MGA_804	LOCUS_08010	sequence015:25694..25882(-)	frameshift		25708	WP_011254325.1	transporter substrate-binding domain-containing protein	93.5	20.3	79.3
MGA_810	LOCUS_08070	sequence016:137..1567(-)	partial			WP_010905926.1	phage tail tape measure protein	98.1	27.7	34.7
MGA_842	LOCUS_08390	sequence016:19220..19993(-)	partial			WP_011860997.1	phage recombination protein Bet	61.1	52.0	51.9
MGA_867	LOCUS_08640	sequence017:8136..9062(-)	frameshift		9084	WP_011475733.1	competence protein CoiA family protein	77.9	78.6	42.9
MGA_884	LOCUS_08810	sequence017:26006..26401(-)	partial			WP_000227333.1	polymorphic toxin type 50 domain-containing protein	98.5	31.5	60.5
MGA_964	LOCUS_09600	sequence021:4732..5520(+)	partial			WP_011476109.1	hypothetical protein	77.5	68.1	34.5
MGA_1004	LOCUS_10000	sequence022:24569..24979(+)	frameshift		25104,24641,24947	WP_011254472.1	RNA-guided endonuclease TnpB family protein	71.3	27.0	58.7
MGA_1006	LOCUS_10020	sequence022:25428..25718(+)	frameshift		25338	WP_011254472.1	RNA-guided endonuclease TnpB family protein	99.0	24.7	70.5
MGA_1009	LOCUS_10050	sequence023:1306..2229(+)	partial			WP_011861238.1	IS200/IS605 family element RNA-guided endonuclease TnpB	80.5	62.6	24.0
MGA_1010	LOCUS_10060	sequence023:2612..2926(+)	frameshift		2899	WP_002286721.1	arginine-ornithine antiporter	91.3	20.5	53.6
MGA_1012	LOCUS_10080	sequence023:3533..3904(+)	partial			WP_007054380.1	acylphosphatase	52.8	67.0	49.2
MGA_1052	LOCUS_10480	sequence024:17412..17771(+)	internal_stop_codon	17256..17258(+)		WP_084742643.1	IS607-like element ISSto11 family transposase	74.8	48.9	39.3
MGA_1060	LOCUS_10550	sequence025:309..1553(-)	partial			WP_010957062.1	TIR domain-containing protein	38.9	42.0	37.1
MGA_1061	LOCUS_10560	sequence025:1694..2062(-)	frameshift,internal_stop_codon	2079..2081(-)	2054	WP_011166415.1	Eco47II family restriction endonuclease	88.5	40.2	42.0
MGA_1100	LOCUS_10950	sequence026:21531..21791(-)	partial			WP_061603534.1	HAD family hydrolase	90.7	27.9	57.7
MGA_1139	LOCUS_11340	sequence028:19650..20573(+)	partial			WP_011475863.1	DNA internalization-related competence protein ComEC/Rec2	81.1	33.2	58.8
MGA_1143	LOCUS_11380	sequence029:3109..4500(-)	partial			WP_002287386.1	NlpC/P60 family protein	24.8	22.1	69.0
MGA_1146	LOCUS_11410	sequence029:7867..8397(+)	partial			WP_003641616.1	signal peptidase I	81.8	73.8	40.0
MGA_1164	LOCUS_11590	sequence030:2357..3424(-)	partial			WP_011103073.1	restriction endonuclease subunit S	34.1	34.2	33.3
MGA_1178	LOCUS_11730	sequence030:18145..18783(-)	internal_stop_codon	18838..18840(-)		WP_003244282.1	class I SAM-dependent DNA methyltransferase	96.2	21.5	50.5
MGA_1179	LOCUS_11740	sequence030:18838..20832(-)	internal_stop_codon	18838..18840(-)		WP_003244282.1	class I SAM-dependent DNA methyltransferase	100.0	75.8	56.4
MGA_1182	LOCUS_11770	sequence031:3515..4072(-)	partial			WP_010931764.1	alanine--glyoxylate aminotransferase family protein	93.0	45.6	33.9
MGA_1185	LOCUS_11800	sequence031:7582..8904(-)	partial			WP_010880882.1	glycerol-3-phosphate cytidylyltransferase	28.0	72.6	52.8
MGA_1187	LOCUS_11820	sequence031:9770..11233(-)	partial			WP_015263274.1	hypothetical protein	82.8	49.5	30.2
MGA_1189	LOCUS_11840	sequence031:12357..13853(-)	partial			WP_015263274.1	hypothetical protein	84.5	50.8	33.3
MGA_1195	LOCUS_11900	sequence031:18433..20607(-)	partial			WP_009898508.1	glycosyltransferase family 2 protein	27.1	50.8	25.7
MGA_1198	LOCUS_11930	sequence032:3445..4197(-)	partial			WP_010905168.1	MATE family efflux transporter	96.4	54.5	23.4
MGA_1212	LOCUS_12070	sequence033:4218..5228(+)	partial			WP_000643829.1	GNAT family N-acetyltransferase	43.8	82.5	39.7
MGA_1213	LOCUS_12080	sequence033:5289..5480(+)	partial			WP_012027683.1	methylenetetrahydrofolate reductase [NAD(P)H]	50.8	11.2	65.6
MGA_1217	LOCUS_12120	sequence033:8420..9250(+)	frameshift		8402	WP_003437109.1	MATE family efflux transporter	97.1	59.8	44.5
MGA_1222	LOCUS_12170	sequence033:14469..14732(+)	frameshift		14745,14615	WP_009895475.1	NUDIX hydrolase	44.8	19.1	61.5
MGA_1223	LOCUS_12180	sequence033:14915..15727(+)	partial			WP_051532688.1	DUF3578 domain-containing protein	61.1	45.5	37.3
MGA_1224	LOCUS_12190	sequence033:15954..17114(+)	partial			WP_143185615.1	DUF262 domain-containing protein	62.2	54.1	23.3
MGA_1230	LOCUS_12250	sequence034:7566..9119(-)	partial			WP_011948347.1	ABC transporter ATP-binding protein	79.3	74.4	25.0
MGA_1232	LOCUS_12270	sequence034:10755..11801(-)	partial			WP_007056327.1	thiazole biosynthesis adenylyltransferase ThiF	30.2	39.0	40.0
MGA_1277	LOCUS_12700	sequence038:5891..6364(+)	partial			WP_100190734.1	IS3 family transposase	96.8	30.1	36.9
MGA_1283	LOCUS_12760	sequence038:13353..13787(-)	partial			WP_003722849.1	LytTR family DNA-binding domain-containing protein	73.6	70.2	45.3
MGA_1286	LOCUS_12790	sequence038:15912..16379(-)	internal_stop_codon	16407..16409(-)		WP_011476518.1	DUF308 domain-containing protein	91.6	81.6	51.4
MGA_1324	LOCUS_13170	sequence041:15261..15518(-)	frameshift		15550	WP_011102204.1	6-phospho-beta-glucosidase	96.5	17.0	65.1
MGA_1338	LOCUS_13310	sequence042:12711..15566(-)	partial			WP_081581110.1	N-acetylmuramoyl-L-alanine amidase	67.7	60.4	39.8
MGA_1350	LOCUS_13430	sequence043:13601..14020(-)	partial			WP_002670247.1	AraC family transcriptional regulator	65.5	28.9	34.1
MGA_1475	LOCUS_14680	sequence054:3277..3585(+)	partial			WP_011102117.1	amino acid permease	78.4	17.4	59.3
MGA_1476	LOCUS_14690	sequence054:3503..3907(+)	partial			WP_002263094.1	amino acid permease	92.5	26.7	31.5
MGA_1478	LOCUS_14710	sequence054:5237..6625(-)	partial			WP_003546132.1	bifunctional acetaldehyde-CoA/alcohol dehydrogenase	97.0	51.1	65.6
MGA_1496	LOCUS_14890	sequence055:9799..10089(-)	partial			WP_219718821.1	hypothetical protein	88.5	16.5	48.2
MGA_1503	LOCUS_14960	sequence056:3272..4249(-)	partial			WP_011948292.1	methyl-accepting chemotaxis protein	84.3	39.2	29.5
MGA_1504	LOCUS_14970	sequence056:4269..5297(-)	partial			WP_011083160.1	FIST N-terminal domain-containing protein	74.9	67.0	29.9
MGA_1534	LOCUS_15260	sequence059:2499..2954(+)	partial			WP_011475718.1	sigma-70 family RNA polymerase sigma factor	59.6	46.4	47.8
MGA_1554	LOCUS_15460	sequence061:8032..8481(+)	frameshift		8427	WP_003643171.1	ABC transporter substrate-binding protein	72.5	24.0	61.1
MGA_1555	LOCUS_15470	sequence061:8390..8833(+)	frameshift		8800,8427	WP_003643171.1	ABC transporter substrate-binding protein	83.0	27.1	54.9
MGA_1556	LOCUS_15480	sequence061:8836..9354(+)	frameshift		8800	WP_003643171.1	ABC transporter substrate-binding protein	98.3	37.6	47.9
MGA_1567	LOCUS_15590	sequence063:117..362(-)	partial			WP_011475670.1	hypothetical protein	77.8	58.3	42.9
MGA_1573	LOCUS_15650	sequence063:5807..9676(-)	partial			WP_010905926.1	phage tail tape measure protein	97.6	72.0	29.0
MGA_1610	LOCUS_16010	sequence068:1..589(+)	partial			WP_003700854.1	glycosyltransferase family 2 protein	100.0	63.0	79.1
MGA_1624	LOCUS_16150	sequence069:3033..3407(+)	frameshift		3401	WP_003429214.1	cysteine hydrolase family protein	98.4	70.5	63.1
MGA_1634	LOCUS_16240	sequence070:3780..4025(-)	frameshift		4048	WP_010890794.1	GNAT family N-acetyltransferase	100.0	59.1	35.8
MGA_1635	LOCUS_16250	sequence070:4034..4198(-)	frameshift		4048	WP_010890794.1	GNAT family N-acetyltransferase	88.9	35.0	50.0
MGA_1639	LOCUS_16290	sequence070:8055..8324(-)	frameshift		8322,8478	WP_140224180.1	ClbS/DfsB family four-helix bundle protein	100.0	52.2	54.3
MGA_1660	LOCUS_16500	sequence072:7957..>8755(-)	partial			WP_003644683.1	ATP phosphoribosyltransferase regulatory subunit	98.1	67.6	40.2
MGA_1665	LOCUS_16540	sequence073:6421..8313(+)	partial			WP_013230933.1	DEAD/DEAH box helicase	72.5	71.2	31.4
MGA_1672	LOCUS_16600	sequence074:6384..6728(+)	frameshift		6668	WP_010964116.1	phosphatidylcholine/phosphatidylserine synthase	72.8	40.5	48.2
MGA_1682	LOCUS_16700	sequence075:5825..6199(+)	internal_stop_codon	6197..6199(+)		WP_003703917.1	metallophosphoesterase family protein	98.4	60.7	59.8
MGA_1683	LOCUS_16710	sequence075:6206..6427(+)	internal_stop_codon	6197..6199(+)		WP_003703917.1	metallophosphoesterase family protein	100.0	36.3	53.4
MGA_1688	LOCUS_16760	sequence076:889..1845(+)	partial			WP_002263236.1	sensor histidine kinase	74.2	72.9	36.0
MGA_1697	LOCUS_16840	sequence077:808..1710(-)	frameshift		1704,1652	WP_011475746.1	competence type IV pilus assembly protein ComGB	90.3	76.2	49.6
MGA_1718	LOCUS_17050	sequence079:5567..5770(-)	partial			WP_137628160.1	helix-turn-helix transcriptional regulator	98.5	47.5	40.9
MGA_1755	LOCUS_17410	sequence084:2506..3333(-)	partial			WP_011476061.1	DUF805 domain-containing protein	51.6	40.2	29.4
MGA_1765	LOCUS_17500	sequence086:281..1021(-)	partial			WP_003082313.1	peptide cleavage/export ABC transporter	94.3	31.6	37.6
MGA_1767	LOCUS_17520	sequence086:3106..3738(-)	partial			WP_015613327.1	GHKL domain-containing protein	95.2	47.3	33.7
MGA_1770	LOCUS_17550	sequence086:4993..5472(+)	partial			WP_002263742.1	thioredoxin family protein	70.4	32.4	26.5
MGA_1787	LOCUS_17720	sequence089:4709..4963(+)	partial			WP_002262851.1	cardiolipin synthase	100.0	16.4	47.6
MGA_1814	LOCUS_17990	sequence096:78..308(+)	frameshift		60	WP_011987017.1	TPR domain-containing glycosyltransferase	98.7	15.9	44.0
MGA_1816	LOCUS_18010	sequence096:2124..2852(+)	partial			WP_011017006.1	sugar phosphate nucleotidyltransferase	93.8	41.9	35.2
MGA_1836	LOCUS_18180	sequence101:365..943(+)	frameshift		940	WP_011674398.1	YfhO family protein	92.7	19.2	33.7
MGA_1838	LOCUS_18200	sequence101:2930..>3566(-)	partial			WP_003700854.1	glycosyltransferase family 2 protein	72.0	48.9	82.2
MGA_1854	LOCUS_18310	sequence106:1..1161(+)	partial			WP_011254350.1	GH25 family lysozyme	59.1	59.4	36.6
MGA_1855	LOCUS_18320	sequence106:1263..1775(+)	partial			WP_003695998.1	DUF4065 domain-containing protein	72.4	60.9	28.7
MGA_1871	LOCUS_18460	sequence111:863..1531(-)	partial			WP_000359383.1	hypothetical protein	51.4	48.0	36.0
MGA_1890	LOCUS_18580	sequence119:660..1124(+)	partial			WP_003438111.1	gamma-glutamyl-gamma-aminobutyrate hydrolase family protein	84.4	53.9	45.5
MGA_1893	LOCUS_18600	sequence121:41..181(+)	frameshift		160	WP_003642100.1	DUF554 domain-containing protein	82.6	16.9	63.2
MGA_1894	LOCUS_18610	sequence121:172..711(+)	frameshift		160	WP_003242513.1	DUF554 domain-containing protein	97.2	76.0	63.8
MGA_1897	LOCUS_18640	sequence122:1..1121(+)	partial			WP_011254604.1	RNA-guided endonuclease TnpB family protein	59.4	74.7	55.4
MGA_1900	LOCUS_18650	sequence124:84..476(-)	internal_stop_codon	84..86(-)		WP_041272192.1	transposase	100.0	28.0	35.4
MGA_1908	LOCUS_18690	sequence128:202..462(+)	frameshift		408,492	WP_010989544.1	glycosyltransferase family 2 protein	75.6	10.5	49.3
MGA_1909	LOCUS_18700	sequence128:533..955(+)	frameshift		411,516	WP_011987017.1	TPR domain-containing glycosyltransferase	88.6	26.0	31.2
