# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_128	LOCUS_01280	sequence1:151483..152145(+)	partial			WP_005483608.1	site-specific integrase	99.5	57.9	84.9
MGA_168	LOCUS_01680	sequence1:199669..199887(+)	partial			WP_005460046.1	DUF2878 domain-containing protein	91.7	38.8	69.7
MGA_305	LOCUS_03050	sequence1:357433..357822(+)	partial			WP_001894072.1	translation initiation factor IF-3	100.0	70.5	84.5
MGA_329	LOCUS_03290	sequence1:381377..381901(+)	frameshift		381874	WP_005480702.1	nicotinate-nucleotide--dimethylbenzimidazole phosphoribosyltransferase	95.4	47.8	80.7
MGA_330	LOCUS_03300	sequence1:381891..382421(+)	frameshift		381874	WP_005480702.1	nicotinate-nucleotide--dimethylbenzimidazole phosphoribosyltransferase	100.0	50.7	79.5
MGA_379	LOCUS_03790	sequence1:431403..431807(-)	partial			WP_064255339.1	lysozyme inhibitor LprI family protein	64.9	63.3	30.7
MGA_439	LOCUS_04390	sequence1:499508..500377(+)	frameshift		500374	WP_010926026.1	arylsulfatase	90.7	60.0	48.9
MGA_440	LOCUS_04400	sequence1:500472..500948(+)	frameshift		500374	WP_010926625.1	arylsulfatase	88.0	29.7	40.7
MGA_441	LOCUS_04410	sequence1:501101..502360(+)	partial			WP_011706294.1	retention module-containing protein	64.7	7.5	31.3
MGA_442	LOCUS_04420	sequence1:502326..513242(+)	frameshift		502336,502339	WP_011706294.1	retention module-containing protein	84.0	84.1	25.4
MGA_487	LOCUS_04870	sequence1:566988..567350(-)	frameshift		567402	WP_005454971.1	DUF2760 domain-containing protein	100.0	57.1	97.5
MGA_488	LOCUS_04880	sequence1:567385..567621(-)	frameshift		567402	WP_005454971.1	DUF2760 domain-containing protein	44.9	16.7	85.7
MGA_607	LOCUS_06070	sequence1:690452..690664(-)	frameshift		690740	WP_005458262.1	cell division protein ZapC	100.0	38.9	81.4
MGA_608	LOCUS_06080	sequence1:690732..690995(-)	frameshift		690740	WP_005458262.1	cell division protein ZapC	98.9	47.8	94.2
MGA_636	LOCUS_06360	sequence1:728331..733271(-)	frameshift		733362	WP_011707240.1	retention module-containing protein	69.3	20.5	32.3
MGA_641	LOCUS_06410	sequence1:734768..735427(-)	frameshift,internal_stop_codon	735431..735433(-)	735440,734836	WP_016361986.1	Calx-beta domain-containing protein	85.4	6.1	30.7
MGA_642	LOCUS_06420	sequence1:735402..737315(-)	frameshift,internal_stop_codon	735431..735433(-)	735440,735425,737364	WP_016361986.1	Calx-beta domain-containing protein	98.6	20.2	29.6
MGA_643	LOCUS_06430	sequence1:737338..738837(-)	frameshift		737364	WP_016361986.1	Calx-beta domain-containing protein	96.4	15.5	30.3
MGA_644	LOCUS_06440	sequence1:738827..740902(-)	frameshift		738832	WP_011105887.1	Calx-beta domain-containing protein	100.0	30.3	39.5
MGA_647	LOCUS_06470	sequence1:743307..759344(-)	partial			WP_005477759.1	tandem-95 repeat protein	45.9	79.0	46.1
MGA_772	LOCUS_07720	sequence1:889780..891819(+)	partial			WP_003243926.1	para-nitrobenzyl esterase	33.3	45.2	37.4
MGA_796	LOCUS_07960	sequence1:910147..910647(+)	frameshift		910126	WP_000520332.1	MFS transporter	93.4	36.5	69.0
MGA_797	LOCUS_07970	sequence1:910605..910832(-)	partial			WP_011236150.1	IS200/IS605-like element ISAzo20 family transposase	96.0	50.0	66.7
MGA_798	LOCUS_07980	sequence1:910942..911637(-)	partial			WP_010973830.1	4'-phosphopantetheinyl transferase	77.9	74.4	37.9
MGA_813	LOCUS_08130	sequence1:932750..933487(-)	partial			WP_050298568.1	enterochelin esterase	95.9	53.7	45.5
MGA_819	LOCUS_08190	sequence1:939463..940905(+)	partial			WP_164929447.1	tetratricopeptide repeat protein	22.5	51.5	32.1
MGA_823	LOCUS_08230	sequence1:942829..943101(-)	internal_stop_codon	943144..943146(-)		WP_011706213.1	GNAT family N-acetyltransferase	98.9	55.3	56.2
MGA_830	LOCUS_08300	sequence1:946807..947766(-)	partial			WP_109282207.1	phosphotransferase	74.3	70.2	21.4
MGA_842	LOCUS_08420	sequence1:956765..957145(-)	partial			WP_004188671.1	DUF4087 domain-containing protein	83.3	72.8	39.3
MGA_848	LOCUS_08480	sequence1:960783..961517(-)	partial			WP_049188803.1	hypothetical protein	57.0	53.5	38.6
MGA_849	LOCUS_08490	sequence1:961663..962229(-)	partial			WP_000557907.1	5-methylcytosine-specific endonuclease McrA	55.9	37.5	41.9
MGA_854	LOCUS_08540	sequence1:966663..967076(-)	partial			WP_011405426.1	hypothetical protein	68.6	60.6	36.2
MGA_859	LOCUS_08590	sequence1:969560..970342(-)	frameshift		970359	WP_155767756.1	IS3 family transposase	99.2	71.4	42.3
MGA_862	LOCUS_08620	sequence1:971806..972657(-)	frameshift		972674	WP_155767756.1	IS3 family transposase	99.3	71.4	44.5
MGA_865	LOCUS_08650	sequence1:974079..974861(-)	frameshift		974878	WP_155767756.1	IS3 family transposase	99.2	71.4	42.7
MGA_901	LOCUS_09010	sequence1:1003357..1004178(-)	partial			WP_011263036.1	HNH endonuclease	60.1	40.5	42.7
MGA_905	LOCUS_09050	sequence1:1006711..1007493(-)	frameshift		1007510	WP_155767756.1	IS3 family transposase	99.2	71.4	42.3
MGA_929	LOCUS_09290	sequence1:1031348..1036135(-)	partial			WP_003113014.1	PAS domain S-box protein	41.9	48.3	28.7
MGA_952	LOCUS_09520	sequence1:1061374..1061673(-)	partial			WP_005457820.1	DUF882 domain-containing protein	100.0	54.4	90.9
MGA_1015	LOCUS_10150	sequence1:1140461..1141405(+)	partial			WP_000904079.1	type VI secretion system immunity protein TsiV2	39.5	50.4	31.2
MGA_1037	LOCUS_10370	sequence1:1164040..1164852(-)	partial			WP_010951317.1	TIGR02594 family protein	52.6	81.6	36.7
MGA_1038	LOCUS_10380	sequence1:1165277..1165498(+)	partial			WP_005457970.1	hypothetical protein	100.0	41.2	79.5
MGA_1049	LOCUS_10490	sequence1:1179009..1179923(+)	partial			WP_005457979.1	paraquat-inducible protein A	100.0	68.6	92.1
MGA_1100	LOCUS_11000	sequence1:1240372..1240752(+)	partial			WP_005482409.1	disulfide bond formation protein DsbB	100.0	70.8	87.3
MGA_1146	LOCUS_11460	sequence1:1290505..1292283(-)	partial			WP_013097383.1	phage tail protein	78.4	67.9	31.4
MGA_1231	LOCUS_12310	sequence1:1373247..1373516(-)	partial			WP_005460100.1	YbaN family protein	100.0	66.4	85.4
MGA_1253	LOCUS_12530	sequence1:1397617..1397880(+)	frameshift		1397458	WP_005457721.1	endonuclease SmrB	100.0	49.4	97.7
MGA_1256	LOCUS_12560	sequence1:1401761..1402015(+)	partial			WP_005457697.1	hypothetical protein	71.4	71.4	80.0
MGA_1403	LOCUS_14030	sequence1:1547904..1548203(-)	frameshift		1548376	WP_005456539.1	FAD:protein FMN transferase	100.0	29.6	96.0
MGA_1404	LOCUS_14040	sequence1:1548149..1548907(-)	frameshift		1548379	WP_005456539.1	FAD:protein FMN transferase	70.6	53.3	93.8
MGA_1459	LOCUS_14590	sequence1:1612106..1613101(-)	partial			WP_145647357.1	acetate kinase	90.6	64.8	40.8
MGA_1505	LOCUS_15050	sequence1:1666116..1667201(+)	frameshift		1665963	WP_005490383.1	peptidoglycan DD-metalloendopeptidase family protein	100.0	84.1	92.8
MGA_1540	LOCUS_15400	sequence1:1717514..1717909(-)	partial			WP_005490362.1	LpxL/LpxP family Kdo(2)-lipid IV(A) lauroyl/palmitoleoyl acyltransferase	100.0	42.4	93.1
MGA_1718	LOCUS_17160	sequence1:1915966..1920555(-)	partial			WP_005490538.1	hypothetical protein	21.0	22.0	59.1
MGA_1724	LOCUS_17220	sequence1:1923192..1923695(-)	partial			WP_139685680.1	type II secretion system protein	61.1	60.1	58.7
MGA_1805	LOCUS_17990	sequence1:2024419..2024970(-)	partial			WP_005464765.1	peptidylprolyl isomerase	78.7	74.6	96.5
MGA_1952	LOCUS_19390	sequence1:2199923..2200282(-)	internal_stop_codon	2199923..2199925(-)		WP_011263378.1	DNA repair protein RadC	88.2	66.9	68.6
MGA_1955	LOCUS_19420	sequence1:2205200..2206435(+)	partial			WP_209435792.1	restriction endonuclease subunit S	46.7	47.5	63.5
MGA_2195	LOCUS_21760	sequence1:2478696..2478899(-)	partial			WP_157032699.1	IS3 family transposase	100.0	16.6	73.1
MGA_2196	LOCUS_21770	sequence1:2479505..2479900(-)	frameshift		2479549	WP_089068031.1	IS3 family transposase	91.6	29.4	68.3
MGA_2238	LOCUS_22190	sequence1:2527129..2527671(-)	partial			WP_005459005.1	amidophosphoribosyltransferase	96.7	72.2	81.0
MGA_2252	LOCUS_22330	sequence1:2544203..2544385(-)	frameshift		2544253	WP_005379346.1	DNA-directed RNA polymerase subunit omega	75.0	50.0	100.0
MGA_2313	LOCUS_22940	sequence1:2606655..2607917(+)	partial			WP_002288207.1	glycosyltransferase family 2 protein	97.4	58.9	28.3
MGA_2315	LOCUS_22960	sequence1:2608839..2609846(-)	partial			WP_011793001.1	sugar transferase	78.2	58.5	44.7
MGA_2333	LOCUS_23140	sequence1:2629951..2630130(+)	partial			WP_003022494.1	GIY-YIG nuclease family protein	89.8	56.4	54.7
MGA_2559	LOCUS_25400	sequence1:2881055..2881924(+)	frameshift		2880900	WP_100069987.1	peptide chain release factor 2	98.3	77.8	91.2
MGA_2600	LOCUS_25810	sequence1:2926307..2926702(+)	frameshift		2926657	WP_089068031.1	IS3 family transposase	91.6	29.4	68.3
MGA_2601	LOCUS_25820	sequence1:2927308..2927511(+)	partial			WP_157032699.1	IS3 family transposase	100.0	16.6	73.1
MGA_2613	LOCUS_25920	sequence1:2943602..2943781(-)	partial			WP_005460170.1	YfhL family 4Fe-4S dicluster ferredoxin	100.0	70.2	93.2
MGA_2740	LOCUS_27190	sequence1:3084295..3084498(-)	partial			WP_157032699.1	IS3 family transposase	100.0	16.6	73.1
MGA_2741	LOCUS_27200	sequence1:3085104..3085499(-)	frameshift		3085148	WP_089068031.1	IS3 family transposase	91.6	29.4	68.3
MGA_2841	LOCUS_28200	sequence1:3195925..3196986(-)	partial			WP_011263703.1	cellulose biosynthesis protein BcsE	91.5	62.6	32.5
MGA_3015	LOCUS_29940	sequence2:51086..51868(+)	partial			WP_005478324.1	oligosaccharide flippase family protein	100.0	59.8	73.5
MGA_3035	LOCUS_30140	sequence2:73777..74169(+)	frameshift		74127	WP_089068031.1	IS3 family transposase	92.3	29.4	69.2
MGA_3036	LOCUS_30150	sequence2:74778..74981(+)	partial			WP_157032699.1	IS3 family transposase	100.0	16.6	73.1
MGA_3058	LOCUS_30370	sequence2:100886..102652(+)	frameshift		102598	WP_011106517.1	VWA domain-containing protein	75.7	72.0	77.8
MGA_3059	LOCUS_30380	sequence2:102649..102834(+)	frameshift		102598	WP_011106517.1	VWA domain-containing protein	62.3	6.1	86.8
MGA_3080	LOCUS_30590	sequence2:129331..130386(+)	partial			WP_005462928.1	transposase	100.0	71.8	94.0
MGA_3086	LOCUS_30650	sequence2:136250..136840(+)	frameshift,internal_stop_codon	136784..136786(+)	136777,136786	WP_005478313.1	DUF3744 domain-containing protein	91.8	31.1	96.1
MGA_3087	LOCUS_30660	sequence2:136897..137988(+)	frameshift,internal_stop_codon	136784..136786(+)	136777,136789	WP_005478313.1	DUF3744 domain-containing protein	100.0	62.7	97.2
MGA_3132	LOCUS_31110	sequence2:188394..189134(+)	frameshift		189047	WP_005462828.1	LysR substrate-binding domain-containing protein	88.6	73.6	83.9
MGA_3226	LOCUS_32050	sequence2:290071..290340(+)	partial			WP_005480121.1	hypothetical protein	100.0	63.1	70.8
MGA_3254	LOCUS_32330	sequence2:324905..325468(+)	frameshift,internal_stop_codon	325359..325361(+),325459..325461(+)	325442,325348	WP_049769589.1	TRAP transporter large permease subunit	81.3	25.1	29.1
MGA_3255	LOCUS_32340	sequence2:325465..326745(+)	partial			WP_011459065.1	TRAP transporter large permease subunit	96.2	65.7	46.1
MGA_3256	LOCUS_32350	sequence2:327259..328233(+)	partial			WP_011860914.1	ester cyclase	97.8	68.0	33.4
MGA_3333	LOCUS_33120	sequence2:421015..421671(-)	partial			WP_005464837.1	LysR family transcriptional regulator	100.0	71.9	95.0
MGA_3347	LOCUS_33260	sequence2:439564..439701(+)	frameshift		439528	WP_005477463.1	DUF3283 family protein	100.0	65.2	91.1
MGA_3427	LOCUS_34060	sequence2:515736..516263(+)	internal_stop_codon	515622..515624(+)		WP_011106217.1	prepilin-type N-terminal cleavage/methylation domain-containing protein	100.0	74.8	93.7
MGA_3449	LOCUS_34260	sequence2:540510..540965(+)	frameshift		540950	WP_011261945.1	hypothetical protein	98.0	43.1	72.3
MGA_3450	LOCUS_34270	sequence2:540965..541270(+)	frameshift,internal_stop_codon	541281..541283(+)	541265,540953	WP_011261945.1	hypothetical protein	98.0	28.9	67.7
MGA_3468	LOCUS_34450	sequence2:557308..557535(+)	partial			WP_005479615.1	hypothetical protein	100.0	70.8	85.3
MGA_3491	LOCUS_34680	sequence2:585144..585926(-)	partial			WP_005459327.1	GGDEF domain-containing protein	100.0	64.7	66.9
MGA_3590	LOCUS_35660	sequence2:685444..686163(-)	partial			WP_000753659.1	HTH-type transcriptional regulator EutR	90.8	66.6	30.9
MGA_3591	LOCUS_35670	sequence2:686579..687127(+)	frameshift		687010	WP_011103255.1	ethanolamine ammonia-lyase subunit EutB	80.8	31.7	60.5
MGA_3592	LOCUS_35680	sequence2:687127..687990(+)	frameshift		687010	WP_003093232.1	ethanolamine ammonia-lyase subunit EutB	97.6	60.6	69.8
MGA_3631	LOCUS_36070	sequence2:724336..725868(+)	frameshift		725856	WP_005479898.1	efflux RND transporter permease subunit	99.4	48.2	95.7
MGA_3632	LOCUS_36080	sequence2:725919..727493(+)	frameshift		725856	WP_005479898.1	efflux RND transporter permease subunit	100.0	49.8	91.0
MGA_3736	LOCUS_37120	sequence2:840394..841395(+)	partial			WP_014206790.1	AraC family transcriptional regulator	47.4	46.6	28.8
MGA_3741	LOCUS_37170	sequence2:844791..846113(+)	partial			WP_003113589.1	sensor histidine kinase ParS	64.1	65.7	32.2
MGA_3757	LOCUS_37330	sequence2:861191..861376(+)	partial			WP_005463466.1	GIY-YIG nuclease family protein	93.4	53.8	71.9
MGA_3819	LOCUS_37950	sequence2:928236..929531(-)	partial			WP_010906161.1	linear amide C-N hydrolase	69.1	71.8	26.4
MGA_3821	LOCUS_37970	sequence2:930411..932114(-)	partial			WP_011071841.1	FAD-binding protein	86.6	58.7	41.6
MGA_3823	LOCUS_37990	sequence2:932994..935126(-)	partial			WP_001066611.1	adenylate/guanylate cyclase domain-containing protein	46.8	24.4	21.0
MGA_3825	LOCUS_38010	sequence2:937036..938334(+)	partial			WP_011070576.1	phytanoyl-CoA dioxygenase family protein	39.8	25.4	33.0
MGA_3826	LOCUS_38020	sequence2:938327..939289(+)	partial			WP_004081384.1	methionyl-tRNA formyltransferase	58.4	58.1	25.7
MGA_3828	LOCUS_38040	sequence2:940170..941654(+)	frameshift		941651,941636,941645,941639	WP_001237656.1	Ig-like domain repeat protein	89.9	12.4	28.5
MGA_3831	LOCUS_38070	sequence2:950313..951140(-)	partial			WP_013224276.1	PLP-dependent aminotransferase family protein	97.8	57.7	36.5
MGA_3862	LOCUS_38380	sequence2:1005524..1006981(+)	partial			WP_005493834.1	DUF4150 domain-containing protein	94.4	62.7	46.5
MGA_3872	LOCUS_38480	sequence2:1016071..1016262(+)	partial			WP_000712921.1	hypothetical protein	52.4	50.8	69.7
MGA_3971	LOCUS_39470	sequence2:1142793..1143173(-)	frameshift		1143192	WP_021451094.1	fatty acid cis/trans isomerase	100.0	16.1	92.9
MGA_3972	LOCUS_39480	sequence2:1143154..1145148(-)	frameshift		1143195	WP_021451094.1	fatty acid cis/trans isomerase	98.2	83.2	91.3
MGA_4045	LOCUS_40210	sequence2:1223825..1224037(+)	partial			WP_005478461.1	beta-eliminating lyase-related protein	100.0	19.6	91.4
MGA_4050	LOCUS_40260	sequence2:1226721..1227419(-)	partial			WP_010972330.1	DMT family transporter	93.5	71.9	26.1
MGA_4053	LOCUS_40290	sequence2:1228886..1229725(+)	partial			WP_209238565.1	MBL fold metallo-hydrolase	86.7	68.6	31.2
MGA_4064	LOCUS_40400	sequence2:1244039..1244749(+)	partial			WP_011262030.1	hypothetical protein	42.8	70.0	46.7
MGA_4088	LOCUS_40640	sequence2:1273430..1274131(+)	frameshift		1274110	WP_005479127.1	DEAD/DEAH box helicase	97.4	54.4	88.1
MGA_4089	LOCUS_40650	sequence2:1274125..1274688(+)	frameshift		1274110	WP_005479127.1	DEAD/DEAH box helicase	98.4	44.1	89.7
MGA_4119	LOCUS_40950	sequence2:1305623..1306120(-)	frameshift		1306191	WP_005455373.1	arylesterase	100.0	82.5	90.3
MGA_4128	LOCUS_41040	sequence2:1317247..1318170(-)	frameshift		1318370	WP_055063916.1	TonB-dependent hemoglobin/transferrin/lactoferrin family receptor	100.0	44.0	52.1
MGA_4129	LOCUS_41050	sequence2:1318326..1319384(-)	frameshift		1318373	WP_005480856.1	TonB-dependent hemoglobin/transferrin/lactoferrin family receptor	89.8	44.3	58.9
MGA_4147	LOCUS_41230	sequence2:1333042..1334382(+)	partial			WP_011391484.1	P-loop NTPase fold protein	59.6	62.6	35.9
MGA_4174	LOCUS_41500	sequence2:1356021..1356704(-)	partial			WP_005460890.1	RimK/LysX family protein	67.4	67.4	87.6
MGA_4194	LOCUS_41700	sequence2:1377889..1378797(+)	frameshift		1378713	WP_005486302.1	signal transduction histidine-protein kinase/phosphatase UhpB	91.4	55.2	95.7
MGA_4195	LOCUS_41710	sequence2:1378761..1379390(+)	frameshift		1378716	WP_005486302.1	signal transduction histidine-protein kinase/phosphatase UhpB	100.0	41.8	96.2
MGA_4293	LOCUS_42690	sequence2:1493397..1493600(-)	partial			WP_157032699.1	IS3 family transposase	100.0	16.6	73.1
MGA_4294	LOCUS_42700	sequence2:1494209..1494601(-)	frameshift		1494250	WP_089068031.1	IS3 family transposase	92.3	29.4	68.3
MGA_4306	LOCUS_42820	sequence2:1507189..1509354(+)	partial			WP_002209275.1	heparinase II/III family protein	53.8	51.8	26.3
MGA_4367	LOCUS_43430	sequence2:1580305..1581198(-)	partial			WP_012259506.1	alpha/beta fold hydrolase	98.0	62.4	28.4
MGA_4385	LOCUS_43610	sequence2:1598317..1599075(-)	frameshift		1599149	WP_011262762.1	GTP-binding protein	99.2	73.2	64.8
MGA_4397	LOCUS_43730	sequence2:1611218..1611553(+)	frameshift		1611798	WP_021821499.1	bifunctional diguanylate cyclase/phosphodiesterase	96.4	20.9	83.2
MGA_4442	LOCUS_44180	sequence2:1662311..1670401(-)	frameshift		1670360,1670363,1670381,1670366	WP_005477759.1	tandem-95 repeat protein	80.5	67.2	26.2
MGA_4443	LOCUS_44190	sequence2:1670352..1681172(-)	frameshift		1670369,1671554,1670381,1681332,1671572,1670359,1670360,1681341	WP_005477759.1	tandem-95 repeat protein	69.9	79.9	25.7
MGA_4444	LOCUS_44200	sequence2:1681330..1682712(-)	frameshift,internal_stop_codon	1681341..1681343(-)	1681356,1681326,1681362,1681332,1681338,1681308,1681341	WP_005477759.1	tandem-95 repeat protein	62.0	8.6	34.6
MGA_4447	LOCUS_44230	sequence2:1684626..1686857(+)	partial			WP_011262974.1	sensor histidine kinase HahK	16.7	21.4	39.8
MGA_4450	LOCUS_44260	sequence2:1689829..1691967(+)	partial			WP_011074382.1	peptidase domain-containing ABC transporter	73.9	72.4	22.7
MGA_4465	LOCUS_44410	sequence2:1702639..1703349(-)	frameshift		1702680	WP_011106290.1	SURF1 family protein	95.8	81.3	68.6
MGA_4550	LOCUS_45260	sequence2:1793691..1795217(-)	partial			WP_033929385.1	methyl-accepting chemotaxis protein	76.0	60.3	39.5
MGA_4563	LOCUS_45390	sequence2:1808164..1809012(-)	frameshift		1809047	WP_015064447.1	ABC transporter ATP-binding protein	83.0	42.6	44.1
MGA_4564	LOCUS_45400	sequence2:1809033..1809920(-)	frameshift		1809035	WP_010972717.1	ABC transporter ATP-binding protein	84.1	46.7	38.7
