# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_6	LOCUS_00050	sequence1:7576..7860(+)	internal_stop_codon	7549..7551(+)		WP_001261062.1	Hsp20 family protein	98.9	64.1	86.0
MGA_74	LOCUS_00720	sequence1:89900..90430(-)	frameshift		90602	WP_032468650.1	ComF family protein	98.9	60.8	62.6
MGA_97	LOCUS_00950	sequence1:122677..122997(-)	partial			WP_011072286.1	IS630-like element ISSod10 family transposase	56.6	17.6	55.0
MGA_110	LOCUS_01080	sequence1:135627..136655(-)	partial			WP_001884305.1	COG3650 family protein	99.4	66.5	56.4
MGA_138	LOCUS_01360	sequence1:162529..163041(-)	internal_stop_codon	163141..163143(-)		WP_011073833.1	IS4-like element ISSod7 family transposase	96.5	37.5	53.6
MGA_139	LOCUS_01370	sequence1:163141..163857(-)	internal_stop_codon	163141..163143(-)		WP_011815285.1	IS4 family transposase	99.6	53.4	51.5
MGA_143	LOCUS_01410	sequence1:165422..166273(+)	partial			WP_011105416.1	IS66-like element ISPsy5 family transposase	98.9	54.9	46.9
MGA_144	LOCUS_01420	sequence1:166518..167471(-)	partial			WP_001229103.1	glycine betaine transporter OpuD	95.0	59.1	30.4
MGA_268	LOCUS_02650	sequence1:330037..330624(-)	frameshift		330764	WP_000195227.1	TRAP transporter permease	96.9	22.1	69.8
MGA_269	LOCUS_02660	sequence1:330624..332609(-)	frameshift		330764	WP_011261091.1	TRAP transporter permease	93.5	72.2	82.4
MGA_313	LOCUS_03100	sequence1:375406..376671(+)	partial			WP_015038871.1	SIR2 family protein	53.2	48.2	32.2
MGA_314	LOCUS_03110	sequence1:376668..378503(+)	partial			WP_011084726.1	DUF87 domain-containing protein	30.4	27.9	33.2
MGA_315	LOCUS_03120	sequence1:378678..378854(-)	partial			WP_000004192.1	AbrB family transcriptional regulator	94.8	15.9	90.9
MGA_353	LOCUS_03500	sequence1:420238..421254(-)	partial			WP_011964051.1	SMEK domain-containing protein	67.2	66.0	23.3
MGA_424	LOCUS_04210	sequence1:497498..498568(+)	partial			WP_168317624.1	HNH endonuclease	31.7	36.5	33.6
MGA_639	LOCUS_06350	sequence1:759469..759702(+)	partial			WP_005455950.1	DUF3622 domain-containing protein	79.2	61.0	68.9
MGA_651	LOCUS_06470	sequence1:767087..767305(+)	partial			WP_001160170.1	YqcC family protein	97.2	67.0	52.9
MGA_673	LOCUS_06690	sequence1:790103..790447(+)	partial			WP_011261420.1	MliC family protein	66.7	68.8	36.8
MGA_694	LOCUS_06900	sequence1:818868..819809(-)	partial			WP_000947937.1	O-antigen ligase	99.0	70.8	72.3
MGA_771	LOCUS_07670	sequence1:904985..905692(-)	partial			WP_162811139.1	4'-phosphopantetheinyl transferase	68.9	68.4	33.5
MGA_786	LOCUS_07820	sequence1:931010..932005(+)	frameshift		931885	WP_011106455.1	S-type pyocin domain-containing protein	70.4	26.0	54.5
MGA_787	LOCUS_07830	sequence1:932032..933105(+)	partial			WP_013096824.1	S-type pyocin domain-containing protein	91.6	58.4	32.2
MGA_789	LOCUS_07850	sequence1:933642..933836(+)	partial			WP_000122383.1	ribonuclease HI	93.8	38.4	51.7
MGA_796	LOCUS_07920	sequence1:937642..938493(+)	partial			WP_011104442.1	IS66 family transposase	97.5	55.7	45.8
MGA_802	LOCUS_07980	sequence1:944397..944576(-)	frameshift		944592	WP_001279784.1	putative transporter	62.7	6.7	70.3
MGA_804	LOCUS_08000	sequence1:945707..949528(-)	partial			WP_011390114.1	PAS domain S-box protein	64.3	52.6	38.2
MGA_840	LOCUS_08360	sequence1:991664..992083(-)	partial			WP_005482409.1	disulfide bond formation protein DsbB	93.5	73.0	79.2
MGA_879	LOCUS_08750	sequence1:1041555..1041728(-)	partial			WP_001247218.1	tyrosine-type recombinase/integrase	77.2	14.1	56.8
MGA_880	LOCUS_08760	sequence1:1041719..1042108(-)	partial			WP_000290950.1	tyrosine-type recombinase/integrase	90.7	32.6	51.3
MGA_888	LOCUS_08840	sequence1:1048310..1048633(+)	internal_stop_codon	1048244..1048246(+)		WP_001249011.1	methyl-accepting chemotaxis protein	98.1	16.4	53.4
MGA_918	LOCUS_09140	sequence1:1076598..1076777(+)	frameshift		1076765	WP_000002768.1	tyrosine-type recombinase/integrase	94.9	13.6	78.6
MGA_919	LOCUS_09150	sequence1:1077217..1077990(-)	partial			WP_011707494.1	hypothetical protein	62.6	55.1	27.6
MGA_933	LOCUS_09290	sequence1:1097958..1098212(-)	partial			WP_001259524.1	YnjH family protein	71.4	62.4	61.7
MGA_934	LOCUS_09300	sequence1:1098241..1098711(-)	frameshift		1098779	WP_021450949.1	1-aminocyclopropane-1-carboxylate deaminase/D-cysteine desulfhydrase	100.0	52.3	69.9
MGA_935	LOCUS_09310	sequence1:1098738..1099133(-)	frameshift		1098794	WP_000909262.1	1-aminocyclopropane-1-carboxylate deaminase/D-cysteine desulfhydrase	92.4	39.9	60.3
MGA_980	LOCUS_09760	sequence1:1150990..1163676(+)	partial			WP_172625977.1	MARTX multifunctional-autoprocessing repeats-in-toxin holotoxin RtxA	43.6	40.9	80.3
MGA_1042	LOCUS_10380	sequence1:1232131..1232706(-)	partial			WP_005477075.1	hypothetical protein	49.2	62.7	42.6
MGA_1047	LOCUS_10430	sequence1:1237973..1242739(+)	partial			WP_110731829.1	anthrax toxin-like adenylyl cyclase domain-containing protein	30.2	17.3	31.7
MGA_1130	LOCUS_11260	sequence1:1337568..1347275(+)	partial			WP_011707240.1	retention module-containing protein	91.0	56.3	53.9
MGA_1192	LOCUS_11880	sequence1:1415864..1416385(+)	partial			WP_000561940.1	bifunctional molybdopterin-guanine dinucleotide biosynthesis adaptor protein MobB/molybdopterin molybdotransferase MoeA	97.1	27.7	80.4
MGA_1197	LOCUS_11930	sequence1:1419665..1420168(+)	partial			WP_000958712.1	NlpC/P60 family protein	69.5	69.9	75.0
MGA_1268	LOCUS_12640	sequence1:1503386..1504585(+)	partial			WP_005458327.1	endonuclease	91.2	68.0	69.7
MGA_1277	LOCUS_12730	sequence1:1512217..1513836(-)	partial			WP_011266628.1	methyl-accepting chemotaxis protein	70.7	71.1	53.1
MGA_1286	LOCUS_12820	sequence1:1525144..1525662(-)	frameshift		1525676	WP_005458059.1	BCCT family transporter	97.7	32.1	80.4
MGA_1287	LOCUS_12830	sequence1:1525599..1526720(-)	frameshift		1525679	WP_005458059.1	BCCT family transporter	93.0	66.3	84.7
MGA_1312	LOCUS_13080	sequence1:1550477..1552015(-)	partial			WP_011104387.1	methyl-accepting chemotaxis protein	81.1	65.9	28.9
MGA_1333	LOCUS_13290	sequence1:1574943..1576043(-)	partial			WP_011229139.1	type III-B CRISPR module RAMP protein Cmr6	57.9	62.9	34.2
MGA_1367	LOCUS_13630	sequence1:1609926..1612568(-)	partial			WP_011106489.1	hypothetical protein	48.5	28.1	25.3
MGA_1381	LOCUS_13770	sequence1:1624798..1625427(-)	partial			WP_005463204.1	winged helix-turn-helix domain-containing protein	50.2	58.5	59.8
MGA_1415	LOCUS_14110	sequence1:1666584..1667087(-)	frameshift		1667037	WP_001142855.1	NADP-dependent isocitrate dehydrogenase	88.6	20.0	83.8
MGA_1416	LOCUS_14120	sequence1:1667023..1667589(-)	frameshift		1667858,1667037,1667551	WP_005481838.1	NADP-dependent isocitrate dehydrogenase	94.7	24.0	84.8
MGA_1417	LOCUS_14130	sequence1:1667531..1667863(-)	frameshift		1667889,1667858,1667551	WP_005481838.1	NADP-dependent isocitrate dehydrogenase	94.5	14.0	91.3
MGA_1418	LOCUS_14140	sequence1:1667860..1668294(-)	frameshift		1668401,1667858,1668277,1667889	WP_005481838.1	NADP-dependent isocitrate dehydrogenase	88.9	17.3	80.5
MGA_1419	LOCUS_14150	sequence1:1668390..1668815(-)	frameshift		1668404,1668277	WP_001142855.1	NADP-dependent isocitrate dehydrogenase	97.9	18.6	89.1
MGA_1523	LOCUS_15190	sequence1:1788627..1789826(-)	partial			WP_011727550.1	SIR2 family protein	60.4	41.2	27.1
MGA_1564	LOCUS_15600	sequence1:1830077..1830526(-)	frameshift		1830536	WP_005479533.1	NAD(P)H nitroreductase	99.3	81.3	74.3
MGA_1612	LOCUS_16080	sequence1:1885948..1886334(+)	partial			WP_001055412.1	rhombosortase	97.7	68.3	64.0
MGA_1638	LOCUS_16340	sequence1:1915082..1915729(+)	partial			WP_000219805.1	DMT family transporter	99.5	73.5	72.0
MGA_1671	LOCUS_16670	sequence1:1948878..1949723(-)	frameshift		1949724	WP_000119661.1	chemotaxis protein CheA	100.0	35.8	90.4
MGA_1672	LOCUS_16680	sequence1:1949704..1951176(-)	frameshift		1949727	WP_000119661.1	chemotaxis protein CheA	99.0	64.3	60.8
MGA_1902	LOCUS_18980	sequence1:2194284..2194583(+)	partial			WP_005482297.1	YebG family protein	73.7	74.5	91.8
MGA_2166	LOCUS_21610	sequence1:2492031..2496203(-)	partial			WP_022819412.1	hemagglutinin repeat-containing protein	36.5	18.2	22.0
MGA_2167	LOCUS_21620	sequence1:2496215..2498668(-)	partial			WP_050298438.1	contact-dependent inhibition toxin CdiA	45.0	20.0	22.1
MGA_2289	LOCUS_22840	sequence1:2640764..2641408(+)	partial			WP_005480156.1	M20 family metallopeptidase	100.0	57.2	90.7
MGA_2294	LOCUS_22890	sequence1:2646955..2647998(-)	partial			WP_012257167.1	glycosyltransferase family 1 protein	82.4	73.8	32.4
MGA_2299	LOCUS_22940	sequence1:2652121..2652750(-)	partial			WP_157798770.1	CatB-related O-acetyltransferase	75.1	73.7	26.6
MGA_2321	LOCUS_23160	sequence1:2672578..2672793(-)	partial			WP_014966182.1	ISAs1-like element ISEc1 family transposase	74.6	18.8	43.7
MGA_2343	LOCUS_23380	sequence1:2697158..2697874(+)	partial			WP_000146565.1	CatB-related O-acetyltransferase	70.6	79.7	50.3
MGA_2380	LOCUS_23750	sequence1:2733613..2735613(-)	partial			WP_011459237.1	restriction endonuclease-like protein	64.7	47.8	25.9
MGA_2383	LOCUS_23780	sequence1:2740060..2740377(-)	partial			WP_011389728.1	helix-turn-helix transcriptional regulator	76.2	65.6	36.6
MGA_2385	LOCUS_23800	sequence1:2742581..2745469(-)	partial			WP_005479039.1	Ig-like domain-containing protein	55.5	60.3	27.4
MGA_2449	LOCUS_24440	sequence1:2824678..2825109(-)	partial			WP_005478648.1	hypothetical protein	35.7	26.8	70.6
MGA_2494	LOCUS_24860	sequence2:341..490(+)	frameshift		488,335	WP_005464845.1	type I secretion system permease/ATPase	100.0	7.0	95.9
MGA_2495	LOCUS_24870	sequence2:597..983(+)	frameshift		488,335	WP_001154355.1	type I secretion system permease/ATPase	100.0	18.2	89.1
MGA_2496	LOCUS_24880	sequence2:1065..1241(-)	frameshift		1283,1256,1331	WP_000265356.1	FapA family protein	89.7	9.4	67.3
MGA_2497	LOCUS_24890	sequence2:1287..2132(-)	frameshift		2401,1281,2275,2161,1329,1254	WP_000265356.1	FapA family protein	94.0	47.5	76.1
MGA_2498	LOCUS_24900	sequence2:2455..2727(-)	frameshift		2544,2280,2400	WP_005464872.1	FapA family protein	73.3	11.8	47.0
MGA_2500	LOCUS_24920	sequence2:3251..4615(-)	frameshift		3112,3025,3331	WP_000634466.1	SpoIIE family protein phosphatase	93.4	75.2	71.5
MGA_2501	LOCUS_24930	sequence2:4714..4932(-)	frameshift		4731	WP_000110728.1	STAS domain-containing protein	95.8	69.7	72.5
MGA_2503	LOCUS_24950	sequence2:6166..6843(-)	frameshift		6861,7074,7005	WP_011037036.1	chemotaxis response regulator protein-glutamate methylesterase	95.1	61.5	47.5
MGA_2504	LOCUS_24960	sequence2:6840..6995(-)	frameshift		7074,7005,7141,6879	WP_013097812.1	chemotaxis response regulator protein-glutamate methylesterase	88.2	13.4	62.5
MGA_2506	LOCUS_24980	sequence2:9657..9818(-)	frameshift,internal_stop_codon	9634..9636(-)	9474,10083,9639,10059,9612,9549,9711,9648,9456,10098,9363,9558,9879,9528,9819	WP_000896388.1	methyl-accepting chemotaxis protein	90.6	7.2	63.3
MGA_2507	LOCUS_24990	sequence2:10255..10602(-)	frameshift		10080,10293,10182,10184,10296,10299,10059,10095	WP_000896388.1	methyl-accepting chemotaxis protein	87.8	15.9	64.8
MGA_2553	LOCUS_25450	sequence2:54103..54411(+)	partial			WP_001069570.1	VirK/YbjX family protein	80.4	26.8	45.1
MGA_2554	LOCUS_25460	sequence2:54408..54818(+)	partial			WP_001069570.1	VirK/YbjX family protein	90.4	40.2	51.2
MGA_2615	LOCUS_26070	sequence2:127243..127455(+)	frameshift,internal_stop_codon	127201..127203(+)	127193	WP_001131708.1	alkaline phosphatase family protein	92.9	7.0	53.8
MGA_2643	LOCUS_26350	sequence2:158532..158783(+)	partial			WP_005462960.1	phosphate ABC transporter ATP-binding protein PstB	92.8	30.9	89.6
MGA_2671	LOCUS_26630	sequence2:186790..187050(-)	partial			WP_005462828.1	LysR substrate-binding domain-containing protein	73.3	21.3	68.3
MGA_2686	LOCUS_26780	sequence2:202831..203517(-)	partial			WP_005479818.1	DMT family transporter	54.8	41.4	81.6
MGA_2694	LOCUS_26860	sequence2:212177..212356(+)	partial			WP_000793856.1	peptidase T	86.4	12.4	70.6
MGA_2710	LOCUS_27020	sequence2:226720..228234(+)	partial			WP_048064848.1	AAA family ATPase	60.3	60.1	43.8
MGA_2711	LOCUS_27030	sequence2:228227..229768(+)	partial			WP_002212255.1	ATPase RavA stimulator ViaA	74.3	75.6	29.7
MGA_2716	LOCUS_27080	sequence2:232971..236567(+)	partial			WP_000960581.1	STY4851/ECs_5259 family protein	47.9	50.8	22.5
MGA_2728	LOCUS_27200	sequence2:258053..270001(-)	partial			WP_011104106.1	type I polyketide synthase	25.3	31.5	48.1
MGA_2733	LOCUS_27250	sequence2:279967..280893(-)	partial			WP_009909131.1	AraC family transcriptional regulator	52.6	59.0	26.2
MGA_2734	LOCUS_27260	sequence2:281108..282013(-)	partial			WP_000140406.1	yersiniabactin transcriptional regulator YbtA	54.2	49.8	24.8
MGA_2740	LOCUS_27320	sequence2:289851..290090(+)	partial			WP_003089312.1	metalloregulator ArsR/SmtB family transcription factor	89.9	61.2	46.5
MGA_2764	LOCUS_27560	sequence2:316219..316401(+)	frameshift,internal_stop_codon	316113..316115(+),316176..316178(+),316194..316196(+),316417..316419(+),316471..316473(+)	316082,316388,316151	WP_086025317.1	IS1-like element ISYps7 family transposase	95.0	24.6	59.6
MGA_2770	LOCUS_27620	sequence2:321424..323976(-)	partial			WP_011105274.1	glycosyltransferase	52.1	46.5	24.8
MGA_2850	LOCUS_28420	sequence2:417101..417346(+)	partial			WP_005477197.1	hypothetical protein	53.1	60.6	58.1
MGA_2885	LOCUS_28770	sequence2:463737..464039(+)	partial			WP_000029435.1	chemotaxis protein CheC	44.0	22.7	63.6
MGA_2976	LOCUS_29680	sequence2:559256..560107(-)	partial			WP_011105416.1	IS66-like element ISPsy5 family transposase	98.9	54.9	47.3
MGA_2983	LOCUS_29750	sequence2:564060..565271(+)	partial			WP_004550247.1	lyase family protein	72.0	32.0	26.9
MGA_2998	LOCUS_29900	sequence2:580966..581175(-)	partial			WP_155655847.1	YkgJ family cysteine cluster protein	97.1	68.4	73.1
MGA_3009	LOCUS_30010	sequence2:593763..594272(-)	partial			WP_011016073.1	AAA family ATPase	74.6	78.8	28.5
MGA_3012	LOCUS_30040	sequence2:597562..598413(-)	partial			WP_011072702.1	nucleotide-binding protein	49.5	51.7	51.0
MGA_3040	LOCUS_30320	sequence2:634763..635209(-)	partial			WP_011459236.1	DUF3578 domain-containing protein	97.3	16.3	39.3
MGA_3056	LOCUS_30480	sequence2:657651..658139(-)	partial			WP_145772165.1	hypothetical protein	68.5	69.8	53.2
MGA_3081	LOCUS_30730	sequence2:692818..694602(-)	partial			WP_014206327.1	NACHT domain-containing protein	58.9	54.1	27.6
MGA_3083	LOCUS_30750	sequence2:696919..697659(-)	partial			WP_002657369.1	DnaJ domain-containing protein	37.4	34.4	41.7
MGA_3093	LOCUS_30850	sequence2:705526..705735(-)	partial			WP_155655847.1	YkgJ family cysteine cluster protein	97.1	68.4	73.1
MGA_3096	LOCUS_30880	sequence2:710244..711698(-)	partial			WP_013095757.1	hypothetical protein	66.7	68.3	24.3
MGA_3107	LOCUS_30990	sequence2:724636..725076(-)	partial			WP_164993988.1	TM2 domain-containing protein	54.8	35.5	41.4
MGA_3112	LOCUS_31040	sequence2:729579..730145(-)	partial			WP_000557907.1	5-methylcytosine-specific endonuclease McrA	47.9	32.9	46.7
MGA_3117	LOCUS_31090	sequence2:736267..736440(-)	partial			WP_005455023.1	antibiotic biosynthesis monooxygenase	96.5	58.5	58.2
MGA_3122	LOCUS_31140	sequence2:740727..741281(-)	partial			WP_005462179.1	hypothetical protein	31.0	21.9	57.9
MGA_3125	LOCUS_31170	sequence2:747293..748312(-)	partial			WP_011071330.1	DUF4062 domain-containing protein	55.2	52.9	34.3
MGA_3127	LOCUS_31190	sequence2:749975..750823(-)	partial			WP_000966077.1	DUF2971 domain-containing protein	54.6	54.6	26.0
MGA_3139	LOCUS_31310	sequence2:770136..771470(-)	partial			WP_011391484.1	P-loop NTPase fold protein	74.5	75.9	34.4
MGA_3149	LOCUS_31410	sequence2:788150..788638(-)	partial			WP_145772165.1	hypothetical protein	68.5	69.8	53.2
MGA_3164	LOCUS_31560	sequence2:808021..808302(-)	partial			WP_014164108.1	hypothetical protein	86.0	70.1	62.2
MGA_3176	LOCUS_31680	sequence2:824709..825098(-)	partial			WP_001894072.1	translation initiation factor IF-3	100.0	70.5	82.2
MGA_3256	LOCUS_32480	sequence2:923265..923546(+)	partial			WP_032471107.1	hypothetical protein	55.9	57.8	44.2
MGA_3285	LOCUS_32770	sequence2:963346..967431(-)	partial			WP_147443659.1	non-ribosomal peptide synthetase	96.5	12.2	31.7
MGA_3287	LOCUS_32790	sequence2:973183..973470(-)	frameshift		973516	WP_012296527.1	non-ribosomal peptide synthetase	67.4	5.7	39.1
MGA_3288	LOCUS_32800	sequence2:973511..975040(-)	frameshift,internal_stop_codon	973511..973513(-),973499..973501(-)	973456,973483,973501	WP_000503026.1	non-ribosomal peptide synthetase	96.7	22.9	42.1
MGA_3289	LOCUS_32810	sequence2:975074..978124(-)	partial			WP_234622323.1	non-ribosomal peptide synthase/polyketide synthase	98.6	9.0	29.2
MGA_3303	LOCUS_32950	sequence2:1007690..1009273(+)	partial			WP_200913519.1	cyclic diguanylate phosphodiesterase	51.6	52.6	31.9
MGA_3305	LOCUS_32970	sequence2:1010479..1010658(+)	partial			WP_005480125.1	alpha-amylase	83.1	7.1	71.4
MGA_3321	LOCUS_33130	sequence2:1027360..1028295(+)	partial			WP_001132384.1	hypothetical protein	100.0	63.6	72.7
MGA_3331	LOCUS_33230	sequence2:1038678..1038947(+)	partial			WP_000992651.1	hypothetical protein	100.0	64.0	65.2
MGA_3371	LOCUS_33630	sequence2:1083668..1085716(-)	partial			WP_000212116.1	type VI secretion system tip protein TssI/VgrG	99.4	58.3	72.0
MGA_3411	LOCUS_34030	sequence2:1141697..1142173(+)	frameshift		1142149	WP_000846694.1	spermidine/putrescine ABC transporter substrate-binding protein	95.6	43.7	80.8
MGA_3412	LOCUS_34040	sequence2:1142146..1142679(+)	frameshift		1142626,1142149,1142677	WP_000846694.1	spermidine/putrescine ABC transporter substrate-binding protein	95.5	49.3	84.6
MGA_3413	LOCUS_34050	sequence2:1142825..1143223(-)	frameshift		1143472,1143394,1142851,1143442,1143208,1143388,1143448	WP_000985780.1	ParB/RepB/Spo0J family partition protein	90.9	37.2	72.5
MGA_3414	LOCUS_34060	sequence2:1143208..1143387(-)	frameshift		1143472,1143394,1143442,1143208,1143388,1143448	WP_000985780.1	ParB/RepB/Spo0J family partition protein	96.6	17.6	91.2
MGA_3415	LOCUS_34070	sequence2:1143446..1143646(-)	frameshift		1143696,1143393,1143441,1143207,1143447,1143387,1143471	WP_000985780.1	ParB/RepB/Spo0J family partition protein	87.9	18.0	84.5
