# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_3	LOCUS_00020	sequence2:611..1381(-)	partial			WP_011176711.1	type I-C CRISPR-associated endonuclease Cas1c	100.0	74.6	54.3
MGA_18	LOCUS_00170	sequence2:17698..19074(+)	partial			WP_013390211.1	ribonuclease H	60.5	77.7	63.6
MGA_38	LOCUS_00370	sequence2:42468..43598(-)	partial			WP_022173241.1	tRNA pseudouridine synthase A	57.4	71.7	67.1
MGA_39	LOCUS_00380	sequence2:43709..44275(-)	partial			WP_003819143.1	50S ribosomal protein L17	63.3	70.0	84.9
MGA_77	LOCUS_00760	sequence2:69357..70361(-)	partial			WP_003972784.1	type II CAAX endopeptidase family protein	50.6	60.0	40.8
MGA_86	LOCUS_00850	sequence2:79134..79670(-)	internal_stop_codon	79134..79136(-)		WP_013390238.1	GNAT family protein	99.4	72.5	57.6
MGA_87	LOCUS_00860	sequence2:80357..80671(+)	partial			WP_012472143.1	5-formyltetrahydrofolate cyclo-ligase	85.6	35.4	50.6
MGA_115	LOCUS_01140	sequence2:118715..120481(+)	partial			WP_013389584.1	transglutaminase domain-containing protein	99.8	62.6	48.4
MGA_122	LOCUS_01210	sequence2:132757..134625(+)	partial			WP_011109529.1	BspA family leucine-rich repeat surface protein	12.5	7.2	52.6
MGA_140	LOCUS_01390	sequence2:156999..157568(-)	partial			WP_008782692.1	NINE protein	88.9	73.8	44.7
MGA_153	LOCUS_01520	sequence2:171997..172464(-)	frameshift,internal_stop_codon	172120..172122(-)	171984,171730,171893,171818,172140	WP_011068370.1	glucose-1-phosphate thymidylyltransferase RfbA	69.7	35.9	74.1
MGA_154	LOCUS_01530	sequence2:172635..172943(-)	frameshift,internal_stop_codon	172950..172952(-)	172952,172988,173069,173199	WP_004112126.1	bifunctional dTDP-4-dehydrorhamnose 3,5-epimerase family protein/NAD(P)-dependent oxidoreductase	94.1	19.6	39.6
MGA_155	LOCUS_01540	sequence2:173043..173222(-)	frameshift		172944,173019,173383,173067,173500,173197	WP_011068371.1	sugar nucleotide-binding protein	62.7	7.7	78.4
MGA_156	LOCUS_01550	sequence2:173550..173741(-)	frameshift		173793,173380,173591,173753,173500,173835,173868	WP_004112126.1	bifunctional dTDP-4-dehydrorhamnose 3,5-epimerase family protein/NAD(P)-dependent oxidoreductase	79.4	10.4	76.0
MGA_158	LOCUS_01570	sequence2:176237..176602(+)	frameshift,internal_stop_codon	176601..176603(+),176142..176144(+)	176609,176801,176183	WP_011068382.1	sugar transferase	95.0	20.4	50.4
MGA_182	LOCUS_01810	sequence2:207923..209956(-)	partial			WP_007051474.1	hypothetical protein	49.8	79.9	38.6
MGA_191	LOCUS_01900	sequence2:218400..218630(-)	partial			WP_003831420.1	ATP synthase F0 subunit C	73.7	74.7	78.6
MGA_199	LOCUS_01980	sequence2:225515..225955(-)	partial			WP_010886351.1	ABC transporter transmembrane domain-containing protein	95.2	24.1	41.7
MGA_207	LOCUS_02060	sequence2:231726..231965(+)	partial			WP_010948274.1	recombinase family protein	72.2	31.3	50.9
MGA_210	LOCUS_02090	sequence2:232682..236581(-)	partial			WP_011068089.1	LPXTG cell wall anchor domain-containing protein	80.3	64.9	46.4
MGA_233	LOCUS_02320	sequence2:263341..265902(-)	partial			WP_010989891.1	SpaA isopeptide-forming pilin-related protein	18.8	21.4	28.2
MGA_234	LOCUS_02330	sequence2:266177..267220(+)	partial			WP_011068474.1	HAD-IC family P-type ATPase	36.9	14.2	44.5
MGA_243	LOCUS_02420	sequence2:277214..277462(-)	partial			WP_002262052.1	aminodeoxychorismate/anthranilate synthase component II	53.7	23.5	54.5
MGA_246	LOCUS_02450	sequence2:280887..281663(-)	partial			WP_003811773.1	DUF3152 domain-containing protein	69.8	64.7	58.3
MGA_247	LOCUS_02460	sequence2:282251..284806(-)	partial			WP_010989462.1	class 1 internalin InlA	27.3	29.1	32.6
MGA_260	LOCUS_02590	sequence2:298493..300988(-)	partial			WP_009994855.1	type 2 isopentenyl-diphosphate Delta-isomerase	43.0	43.2	51.5
MGA_268	LOCUS_02660	sequence2:309801..310118(-)	partial			WP_013389335.1	PTS ascorbate transporter subunit IIC	79.0	16.4	69.9
MGA_269	LOCUS_02670	sequence2:310232..310795(+)	frameshift		310702	WP_003817399.1	LacI family DNA-binding transcriptional regulator	85.0	45.4	44.7
MGA_283	LOCUS_02800	sequence2:331087..331296(-)	partial			WP_013390264.1	LacI family DNA-binding transcriptional regulator	71.0	54.4	51.0
MGA_304	LOCUS_03010	sequence2:350376..351161(+)	partial			WP_011030525.1	TetR/AcrR family transcriptional regulator	42.1	55.6	41.8
MGA_313	LOCUS_03100	sequence2:360428..362791(+)	partial			WP_011068490.1	YhgE/Pip domain-containing protein	69.9	76.4	47.5
MGA_315	LOCUS_03120	sequence2:363759..365558(-)	partial			WP_011068492.1	ABC transporter permease	35.9	52.3	59.1
MGA_388	LOCUS_03820	sequence3:91778..93682(-)	partial			WP_003815928.1	chromosomal replication initiator protein DnaA	65.6	80.3	77.4
MGA_399	LOCUS_03930	sequence3:105229..105750(+)	partial			WP_013389385.1	cell division protein CrgA	70.5	81.5	58.1
MGA_400	LOCUS_03940	sequence3:106320..108464(+)	partial			WP_010933192.1	leucine-rich repeat domain-containing protein	34.5	20.3	31.3
MGA_403	LOCUS_03970	sequence3:113564..114451(+)	partial			WP_011068518.1	class C sortase	76.3	62.3	52.8
MGA_414	LOCUS_04080	sequence3:130520..132442(+)	partial			WP_011068543.1	trypsin-like peptidase domain-containing protein	63.8	61.6	61.5
MGA_415	LOCUS_04090	sequence3:132795..135434(+)	partial			WP_013389405.1	heavy metal translocating P-type ATPase	68.6	78.9	49.6
MGA_439	LOCUS_04330	sequence3:162148..162492(-)	partial			WP_013390354.1	hypothetical protein	94.7	39.1	40.7
MGA_447	LOCUS_04410	sequence3:170781..171635(+)	partial			WP_000531489.1	tyrosine-protein phosphatase	85.2	73.5	29.4
MGA_456	LOCUS_04500	sequence3:183074..184219(-)	frameshift		184332,184350	WP_010989462.1	class 1 internalin InlA	46.5	22.2	43.3
MGA_462	LOCUS_04560	sequence3:189699..190496(+)	partial			WP_013390253.1	DUF1524 domain-containing protein	74.7	57.6	65.7
MGA_465	LOCUS_04590	sequence3:193200..196610(+)	partial			WP_010941906.1	choice-of-anchor D domain-containing protein	35.0	18.5	34.0
MGA_466	LOCUS_04600	sequence3:197395..201237(-)	partial			WP_000080564.1	DEAD/DEAH box helicase	68.5	81.0	27.1
MGA_479	LOCUS_04730	sequence3:216765..218456(+)	partial			WP_013222952.1	glycosyltransferase family 4 protein	64.3	78.3	39.9
MGA_495	LOCUS_04890	sequence3:237927..238241(+)	partial			WP_012803798.1	D-galactonate dehydratase family protein	100.0	25.2	65.4
MGA_498	LOCUS_04920	sequence3:240068..240634(+)	frameshift		240792	WP_013389421.1	evolved beta-galactosidase subunit alpha	84.6	12.3	63.5
MGA_499	LOCUS_04930	sequence3:240824..241270(+)	frameshift,internal_stop_codon	241268..241270(+)	240792	WP_013389421.1	evolved beta-galactosidase subunit alpha	45.3	5.2	56.7
MGA_500	LOCUS_04940	sequence3:241283..241714(+)	internal_stop_codon	241268..241270(+)		WP_013389421.1	evolved beta-galactosidase subunit alpha	90.9	13.0	36.3
MGA_501	LOCUS_04950	sequence3:241720..241962(+)	partial			WP_013389421.1	evolved beta-galactosidase subunit alpha	90.0	5.6	59.7
MGA_502	LOCUS_04960	sequence3:241887..242159(+)	partial			WP_013389421.1	evolved beta-galactosidase subunit alpha	73.3	5.1	63.6
MGA_519	LOCUS_05130	sequence3:263922..265340(-)	partial			WP_016507753.1	NUDIX hydrolase	67.4	82.5	48.5
MGA_524	LOCUS_05180	sequence3:271853..274432(-)	partial			WP_011109529.1	BspA family leucine-rich repeat surface protein	20.6	20.3	37.3
MGA_535	LOCUS_05290	sequence3:286659..287312(+)	partial			WP_010990076.1	DUF1310 domain-containing protein	44.7	73.0	40.2
MGA_537	LOCUS_05310	sequence3:287706..288722(+)	frameshift		287691	WP_009930426.1	DUF2974 domain-containing protein	98.2	68.9	33.1
MGA_540	LOCUS_05340	sequence3:289597..290397(-)	partial			WP_013389537.1	ribosome maturation factor RimM	59.4	77.0	67.7
MGA_554	LOCUS_05480	sequence3:304400..305311(-)	partial			WP_007057854.1	cell division protein	81.2	74.0	48.0
MGA_578	LOCUS_05700	sequence4:11853..12617(+)	partial			WP_010081174.1	signal peptidase I	72.0	64.9	58.4
MGA_593	LOCUS_05850	sequence4:41780..42703(+)	partial			WP_214304241.1	cobyric acid synthase	94.5	73.3	20.2
MGA_595	LOCUS_05870	sequence4:43696..44388(+)	partial			WP_013363997.1	pilus assembly protein	73.9	72.6	37.1
MGA_614	LOCUS_06060	sequence4:72572..73246(+)	partial			WP_013389591.1	GNAT family N-acetyltransferase	95.5	73.3	47.7
MGA_628	LOCUS_06200	sequence4:95285..95524(+)	partial			WP_007055942.1	very short patch repair endonuclease	83.5	44.4	64.2
MGA_632	LOCUS_06240	sequence4:98498..99022(-)	frameshift		98568,99030	WP_003689349.1	Re/Si-specific NAD(P)(+) transhydrogenase subunit beta	89.1	33.6	74.2
MGA_647	LOCUS_06390	sequence4:117692..118960(-)	partial			WP_013389417.1	MFS transporter	84.4	65.6	27.6
MGA_656	LOCUS_06480	sequence4:130456..131004(-)	frameshift		130500,131165,131014	WP_010819456.1	PfkB family carbohydrate kinase	91.8	26.2	38.9
MGA_658	LOCUS_06500	sequence4:131180..131650(-)	frameshift		131165,131014	WP_010819456.1	PfkB family carbohydrate kinase	72.4	17.9	36.0
MGA_659	LOCUS_06510	sequence4:132003..132392(+)	frameshift		132365	WP_003814258.1	HAD-IC family P-type ATPase	90.7	13.4	49.2
MGA_670	LOCUS_06620	sequence4:150469..152319(-)	partial			WP_011109529.1	BspA family leucine-rich repeat surface protein	17.0	10.7	52.3
MGA_685	LOCUS_06760	sequence4:167652..168950(+)	partial			WP_007053293.1	DivIVA domain-containing protein	77.3	61.0	45.3
MGA_707	LOCUS_06980	sequence4:192874..193134(+)	frameshift,internal_stop_codon	193134..193136(+)	192896,193074,193094,193078,193118	WP_003548204.1	glycoside hydrolase family 78 protein	96.5	8.9	57.8
MGA_709	LOCUS_07000	sequence4:193572..193961(+)	frameshift		194116	WP_003548204.1	glycoside hydrolase family 78 protein	93.8	13.0	45.5
MGA_712	LOCUS_07030	sequence4:194661..195071(+)	frameshift,internal_stop_codon	194585..194587(+),194972..194974(+)	194512,194947,194551	WP_011476249.1	beta-phosphoglucomutase	84.6	51.6	50.4
MGA_715	LOCUS_07060	sequence4:197847..198593(-)	partial			WP_013389652.1	hypothetical protein	97.6	69.5	62.8
MGA_724	LOCUS_07150	sequence4:209922..210239(+)	partial			WP_013389656.1	transcriptional regulator NrdR	97.1	65.8	75.5
MGA_739	LOCUS_07300	sequence4:229744..230106(+)	internal_stop_codon	230104..230106(+)		WP_009994219.1	extracellular solute-binding protein	74.2	20.0	48.3
MGA_740	LOCUS_07310	sequence4:230116..230445(+)	frameshift,internal_stop_codon	230443..230445(+),230104..230106(+),230607..230609(+)	230569,230550	WP_043786697.1	extracellular solute-binding protein	95.4	24.3	41.3
MGA_741	LOCUS_07320	sequence4:230610..230834(+)	frameshift,internal_stop_codon	230608..230610(+),230443..230445(+)	230562,230766	WP_009994219.1	extracellular solute-binding protein	70.3	11.9	47.2
MGA_743	LOCUS_07340	sequence4:231233..232018(+)	frameshift		231952,231877,232007	WP_009994218.1	sugar ABC transporter permease	95.8	78.9	48.1
MGA_744	LOCUS_07350	sequence4:232125..232547(+)	partial			WP_013225176.1	carbohydrate ABC transporter permease	78.6	40.4	41.8
MGA_745	LOCUS_07360	sequence4:232551..232799(+)	partial			WP_003817047.1	N-acetylglucosamine-6-phosphate deacetylase	92.7	18.2	76.3
MGA_755	LOCUS_07460	sequence4:248028..248723(+)	partial			WP_007057260.1	sigma-70 family RNA polymerase sigma factor	79.7	73.6	79.3
MGA_756	LOCUS_07470	sequence4:248749..249042(+)	partial			WP_013389679.1	hypothetical protein	58.8	45.1	59.6
MGA_769	LOCUS_07600	sequence4:261364..262215(+)	partial			WP_011068017.1	SMC-Scp complex subunit ScpB	69.6	82.8	67.2
MGA_779	LOCUS_07700	sequence4:272658..272891(-)	internal_stop_codon	272658..272660(-)		WP_012582801.1	ABC transporter permease	80.5	18.9	48.4
MGA_780	LOCUS_07710	sequence4:273066..273746(-)	frameshift		273068	WP_012582800.1	sugar ABC transporter ATP-binding protein	100.0	46.2	47.2
MGA_785	LOCUS_07760	sequence4:277713..278201(+)	partial			WP_013389699.1	sugar ABC transporter substrate-binding protein	96.3	72.5	33.1
MGA_804	LOCUS_07950	sequence4:305619..306488(+)	partial			WP_013389505.1	class C sortase	87.2	65.5	57.4
MGA_829	LOCUS_08200	sequence4:344347..344589(+)	partial			WP_007055377.1	hypothetical protein	71.2	77.0	52.6
MGA_850	LOCUS_08410	sequence4:376568..377287(-)	partial			WP_003644001.1	NCS2 family permease	64.4	35.4	61.7
MGA_860	LOCUS_08510	sequence4:390161..390334(+)	frameshift		390204	WP_004193507.1	2-hydroxyacid dehydrogenase family protein	71.9	12.9	68.3
MGA_862	LOCUS_08530	sequence4:391652..391858(+)	frameshift,internal_stop_codon	391528..391530(+)	391488,391664,391554,391497,391627,391407	WP_013389559.1	FGGY-family carbohydrate kinase	72.1	9.7	55.1
MGA_863	LOCUS_08540	sequence4:391869..392162(+)	frameshift,internal_stop_codon	392209..392211(+),392326..392328(+),391856..391858(+)	392168,391897,392265,392093	WP_011674994.1	L-ribulose-5-phosphate 3-epimerase	67.0	22.5	73.8
MGA_864	LOCUS_08550	sequence4:392399..392626(+)	frameshift,internal_stop_codon	392325..392327(+),392208..392210(+)	392264,392167	WP_011674994.1	L-ribulose-5-phosphate 3-epimerase	98.7	25.6	64.9
MGA_871	LOCUS_08620	sequence4:400850..403423(+)	partial			WP_137656711.1	primosomal protein N'	44.5	51.3	65.4
MGA_882	LOCUS_08730	sequence4:416246..416893(-)	partial			WP_013389711.1	DUF6466 family protein	74.0	78.1	33.5
MGA_885	LOCUS_08760	sequence4:419009..419614(-)	partial			WP_021975282.1	hypothetical protein	72.1	79.9	48.3
MGA_893	LOCUS_08840	sequence4:425900..426604(+)	partial			WP_017143311.1	hypothetical protein	94.0	58.0	42.6
MGA_939	LOCUS_09300	sequence4:494214..494966(+)	partial			WP_013222252.1	SGNH/GDSL hydrolase family protein	71.2	77.8	35.0
MGA_942	LOCUS_09330	sequence4:497540..498655(+)	partial			WP_013390015.1	helicase	99.5	47.1	51.1
MGA_951	LOCUS_09420	sequence4:506608..507111(+)	frameshift		506449,506554,506467	WP_011068267.1	ABC transporter ATP-binding protein	91.6	50.3	63.0
MGA_968	LOCUS_09590	sequence4:523750..524556(+)	frameshift		523694	WP_013389977.1	transporter substrate-binding domain-containing protein	94.0	77.0	38.7
MGA_980	LOCUS_09710	sequence4:535649..536257(+)	partial			WP_011068095.1	M23 family metallopeptidase	71.8	63.8	45.2
MGA_1018	LOCUS_10090	sequence4:573468..574412(+)	partial			WP_013399605.1	aquaporin	77.7	74.4	45.9
MGA_1031	LOCUS_10220	sequence4:586050..586742(-)	partial			WP_005082398.1	phosphatidylinositol mannoside acyltransferase	84.8	55.5	36.7
MGA_1052	LOCUS_10430	sequence4:608505..611243(-)	partial			WP_013582770.1	excinuclease ABC subunit UvrC	40.5	46.4	67.2
MGA_1069	LOCUS_10600	sequence4:635340..636053(-)	frameshift		636070	WP_003812945.1	ATP-binding cassette domain-containing protein	97.9	80.9	58.4
MGA_1121	LOCUS_11120	sequence4:695171..697978(-)	partial			WP_013389805.1	exodeoxyribonuclease V subunit gamma	74.5	78.8	79.1
MGA_1126	LOCUS_11170	sequence4:701291..701632(-)	frameshift,internal_stop_codon	701300..701302(-)	700998,701350,701624,701100,701263	WP_003646328.1	aldo/keto reductase	80.5	32.3	54.9
MGA_1133	LOCUS_11240	sequence4:712753..713259(+)	partial			WP_046247583.1	helix-turn-helix domain-containing protein	37.5	38.0	46.0
MGA_1138	LOCUS_11290	sequence4:718475..718819(-)	partial			WP_011391392.1	NAD-dependent protein deacylase	68.4	32.5	39.2
MGA_1163	LOCUS_11540	sequence4:747468..747830(-)	partial			WP_013582487.1	phosphoribosyltransferase family protein	96.7	47.1	40.2
MGA_1191	LOCUS_11820	sequence4:784615..784950(-)	partial			WP_011728707.1	SDR family oxidoreductase	51.4	26.4	54.4
MGA_1201	LOCUS_11920	sequence4:797865..798755(-)	partial			WP_162098246.1	ABC transporter ATP-binding protein	85.1	72.9	78.3
MGA_1206	LOCUS_11970	sequence4:804707..805723(+)	frameshift,internal_stop_codon	805466..805468(+)	805405	WP_011068209.1	DNA-processing protein DprA	68.6	42.2	59.0
MGA_1213	LOCUS_12040	sequence4:811916..812827(+)	partial			WP_010989478.1	BspA family leucine-rich repeat surface protein	43.2	17.9	36.6
MGA_1218	LOCUS_12090	sequence4:817185..818525(-)	partial			WP_011068213.1	chloride channel protein	65.5	59.8	53.7
MGA_1230	LOCUS_12210	sequence4:832620..833837(+)	partial			WP_013226921.1	MFS transporter	71.9	70.2	23.5
MGA_1246	LOCUS_12370	sequence4:852802..853341(-)	partial			WP_004138146.1	single-stranded DNA-binding protein	92.2	74.8	41.1
MGA_1277	LOCUS_12680	sequence4:892501..893364(-)	partial			WP_011068791.1	2-amino-4-hydroxy-6-hydroxymethyldihydropteridine diphosphokinase	75.6	42.6	43.4
MGA_1286	LOCUS_12770	sequence4:903743..904687(+)	partial			WP_011476124.1	polyprenyl synthetase family protein	68.5	65.2	34.3
MGA_1308	LOCUS_12990	sequence4:925074..925940(-)	partial			WP_003814664.1	1,4-dihydroxy-2-naphthoate octaprenyltransferase	71.5	64.2	56.8
MGA_1310	LOCUS_13010	sequence4:928428..928892(+)	internal_stop_codon	928890..928892(+)		WP_007053838.1	MFS transporter	100.0	38.9	64.9
MGA_1311	LOCUS_13020	sequence4:928911..929615(+)	internal_stop_codon	928890..928892(+)		WP_013390199.1	MFS transporter	98.3	58.2	63.5
