# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_17	LOCUS_00170	sequence1:15673..16251(+)	partial			WP_005173797.1	lytic transglycosylase domain-containing protein	55.7	70.3	37.5
MGA_49	LOCUS_00490	sequence1:49311..49922(+)	partial			WP_011166827.1	BspA family leucine-rich repeat surface protein	84.2	45.2	33.1
MGA_66	LOCUS_00660	sequence1:68939..69313(+)	partial			WP_002851214.1	50S ribosomal protein L22	83.1	73.0	93.2
MGA_136	LOCUS_01360	sequence1:125847..126491(-)	partial			WP_002858642.1	putative metalloprotease CJM1_0395 family protein	80.8	73.9	54.6
MGA_222	LOCUS_02220	sequence1:205568..207430(+)	partial			WP_002888535.1	McrB family protein	84.5	71.0	52.4
MGA_265	LOCUS_02650	sequence1:244078..244680(-)	partial			WP_102756879.1	BspA family leucine-rich repeat surface protein	82.0	28.0	40.5
MGA_299	LOCUS_02990	sequence1:277904..281263(+)	partial			WP_011100946.1	glycosyltransferase	66.4	82.5	31.4
MGA_300	LOCUS_03000	sequence1:281277..283157(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	71.6	75.4	28.7
MGA_301	LOCUS_03010	sequence1:283245..285095(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	70.1	73.7	27.4
MGA_304	LOCUS_03040	sequence1:286806..287573(+)	frameshift		287570	WP_008763415.1	GDP-L-fucose synthase	100.0	74.2	54.5
MGA_309	LOCUS_03090	sequence1:291170..292711(+)	partial			WP_002858440.1	capsule biosynthesis protein CapA	30.0	24.4	45.5
MGA_313	LOCUS_03130	sequence1:294315..294911(-)	partial			WP_011263798.1	DUF2589 domain-containing protein	91.4	66.8	48.2
MGA_324	LOCUS_03240	sequence1:306577..307050(+)	partial			WP_002867614.1	lysophospholipid acyltransferase family protein	99.4	74.6	63.5
MGA_376	LOCUS_03750	sequence1:359629..359832(+)	partial			WP_002851307.1	cytochrome c oxidase, cbb3-type, CcoQ subunit	86.6	65.5	69.0
MGA_402	LOCUS_04010	sequence1:385078..385782(-)	partial			WP_002851142.1	DUF5644 domain-containing protein	57.7	36.7	50.4
MGA_403	LOCUS_04020	sequence1:385793..386431(-)	partial			WP_002851142.1	DUF5644 domain-containing protein	97.2	56.3	48.3
MGA_420	LOCUS_04190	sequence1:400145..402520(+)	partial			WP_011021623.1	tetratricopeptide repeat protein	91.8	39.2	20.4
MGA_450	LOCUS_04480	sequence1:438417..439049(+)	partial			WP_014565877.1	flavodoxin	65.7	37.1	30.0
MGA_452	LOCUS_04500	sequence1:440521..441438(-)	partial			WP_010891843.1	putative transporter	88.5	70.3	72.3
MGA_456	LOCUS_04540	sequence1:445123..445326(-)	partial			WP_002858725.1	transcriptional regulator	76.1	73.9	80.4
MGA_460	LOCUS_04580	sequence1:453233..453820(+)	partial			WP_002853306.1	ATP-dependent DNA helicase Pif1	97.4	42.1	60.9
MGA_464	LOCUS_04620	sequence1:455656..456300(-)	partial			WP_005902260.1	helix-turn-helix transcriptional regulator	65.4	62.1	30.6
MGA_500	LOCUS_04980	sequence1:486894..487922(-)	partial			WP_002853187.1	hypothetical protein	61.4	59.5	30.8
MGA_514	LOCUS_05120	sequence1:505857..509888(+)	partial			WP_005694039.1	heme/hemopexin-binding protein HxuA	36.6	55.5	23.1
MGA_516	LOCUS_05140	sequence1:512125..512373(-)	partial			WP_002853490.1	CinA family protein	96.3	21.8	63.3
MGA_538	LOCUS_05360	sequence1:541036..542628(-)	partial			WP_002865311.1	methyl-accepting chemotaxis protein	64.7	56.6	29.4
MGA_563	LOCUS_05610	sequence1:566080..568218(-)	partial			WP_000874574.1	vacuolating cytotoxin domain-containing protein	84.6	25.5	25.7
MGA_571	LOCUS_05690	sequence1:576388..576666(-)	partial			WP_002852414.1	AtpZ/AtpI family protein	87.0	73.4	77.5
MGA_592	LOCUS_05900	sequence1:595873..596532(-)	partial			WP_015705435.1	DUF2169 domain-containing protein	62.6	14.4	27.5
MGA_593	LOCUS_05910	sequence1:596543..597223(-)	partial			WP_010714143.1	Rha family transcriptional regulator	50.4	53.8	38.7
MGA_608	LOCUS_06060	sequence1:605565..605741(-)	internal_stop_codon	605805..605807(-)		WP_002852117.1	DNA/RNA non-specific endonuclease	94.8	25.5	60.0
MGA_609	LOCUS_06070	sequence1:605805..606224(-)	internal_stop_codon	605805..605807(-)		WP_002852117.1	DNA/RNA non-specific endonuclease	85.6	55.1	73.1
MGA_621	LOCUS_06190	sequence1:611643..612935(+)	partial			WP_014626412.1	DEAD/DEAH box helicase family protein	62.6	57.3	24.1
MGA_628	LOCUS_06260	sequence1:616910..621076(+)	frameshift		621070	WP_000775280.1	DUF3519 domain-containing protein	19.2	28.5	32.0
MGA_629	LOCUS_06270	sequence1:621990..623159(+)	partial			WP_000775280.1	DUF3519 domain-containing protein	37.8	16.4	34.1
MGA_630	LOCUS_06280	sequence1:623771..625417(+)	partial			WP_000775280.1	DUF3519 domain-containing protein	70.8	43.4	26.1
MGA_634	LOCUS_06320	sequence1:626749..627474(+)	partial			WP_011069307.1	Rha family phage regulatory protein	43.6	33.3	43.4
MGA_670	LOCUS_06680	sequence1:662382..662777(+)	internal_stop_codon	662322..662324(+)		WP_011085759.1	PAS domain-containing protein	98.5	77.5	45.5
MGA_671	LOCUS_06690	sequence1:662752..664125(+)	partial			WP_002790076.1	bipartate energy taxis response protein CetA	71.6	72.8	29.0
MGA_693	LOCUS_06910	sequence1:686755..687420(-)	partial			WP_002852518.1	ABC transporter permease	95.9	70.0	61.8
MGA_710	LOCUS_07080	sequence1:703598..703954(+)	partial			WP_002852364.1	membrane protein	100.0	72.0	48.3
MGA_716	LOCUS_07140	sequence1:709035..709355(+)	partial			WP_010943583.1	metalloregulator ArsR/SmtB family transcription factor	58.5	54.9	50.0
MGA_718	LOCUS_07160	sequence1:709765..710070(+)	frameshift		710031	WP_010933386.1	ACR3 family arsenite efflux transporter	87.1	25.1	46.6
MGA_719	LOCUS_07170	sequence1:710036..710779(+)	frameshift		710031	WP_004398718.1	arsenite efflux transporter Acr3	99.6	70.8	50.8
MGA_753	LOCUS_07510	sequence1:746728..749922(+)	partial			WP_003115288.1	two-partner secretion system exoprotein TpsA4	23.0	17.0	28.3
MGA_761	LOCUS_07590	sequence1:759558..759932(-)	partial			WP_012256140.1	rhodanese-like domain-containing protein	75.0	62.5	34.4
MGA_803	LOCUS_08010	sequence1:797464..798429(-)	frameshift		798432,798471	WP_002864146.1	hypothetical protein	99.7	75.8	65.7
MGA_804	LOCUS_08020	sequence1:798454..798717(-)	frameshift		798432,798471	WP_002864146.1	hypothetical protein	74.7	18.1	49.4
MGA_832	LOCUS_08300	sequence1:821952..824243(-)	partial			WP_002864504.1	flagellar filament capping protein FliD	62.3	75.7	37.6
MGA_865	LOCUS_08630	sequence1:854056..854520(-)	frameshift		854729	WP_002864247.1	DUF2920 family protein	96.1	36.6	47.4
MGA_866	LOCUS_08640	sequence1:854709..855332(-)	frameshift		854729	WP_002864247.1	DUF2920 family protein	87.0	46.2	38.3
MGA_874	LOCUS_08720	sequence1:861759..862394(+)	partial			WP_011263976.1	S24 family peptidase	55.9	58.6	35.0
MGA_912	LOCUS_09100	sequence1:917542..918312(-)	partial			WP_010634228.1	type IVB secretion system protein IcmH/DotU	55.1	53.3	34.0
MGA_974	LOCUS_09720	sequence1:979593..980846(+)	partial			WP_003113036.1	GLUG motif-containing protein	53.5	20.3	30.0
MGA_1024	LOCUS_10220	sequence1:1024398..1026722(+)	partial			WP_000874574.1	vacuolating cytotoxin domain-containing protein	34.5	10.7	25.4
MGA_1027	LOCUS_10250	sequence1:1027888..1028523(+)	partial			WP_002853271.1	AEC family transporter	99.5	69.3	57.1
MGA_1033	LOCUS_10310	sequence1:1035989..1038217(+)	partial			WP_000874574.1	vacuolating cytotoxin domain-containing protein	94.5	26.2	22.6
MGA_1114	LOCUS_11120	sequence1:1114842..1115189(+)	frameshift		1115145,1115226,1114743	WP_011986663.1	class I SAM-dependent methyltransferase	88.7	41.5	41.2
MGA_1140	LOCUS_11380	sequence1:1138037..1139635(-)	partial			WP_002852900.1	hypothetical protein	42.9	39.5	40.2
MGA_1168	LOCUS_11660	sequence1:1165352..1165780(+)	partial			WP_002852989.1	hypothetical protein	72.5	71.8	41.1
MGA_1199	LOCUS_11970	sequence1:1193150..1194091(-)	internal_stop_codon	1194260..1194262(-)		WP_002857955.1	2-iminoacetate synthase ThiH	99.4	81.6	77.8
MGA_1206	LOCUS_12040	sequence1:1198472..1201279(-)	frameshift		1201290	WP_002864285.1	N-6 DNA methylase	100.0	69.5	68.3
MGA_1207	LOCUS_12050	sequence1:1201276..1202502(-)	frameshift		1201293	WP_002864285.1	N-6 DNA methylase	99.8	30.4	95.8
MGA_1211	LOCUS_12090	sequence1:1206429..1207991(-)	frameshift		1208173	WP_010891905.1	LTA synthase family protein	98.1	78.2	51.1
MGA_1212	LOCUS_12100	sequence1:1208150..1208401(-)	frameshift		1208173	WP_010891905.1	LTA synthase family protein	81.9	11.1	42.5
MGA_1220	LOCUS_12180	sequence1:1218555..1221407(-)	partial			WP_003115288.1	two-partner secretion system exoprotein TpsA4	16.4	10.4	33.3
MGA_1241	LOCUS_12390	sequence1:1243248..1243520(+)	frameshift,internal_stop_codon	1243495..1243497(+)	1243484	WP_010891905.1	LTA synthase family protein	95.6	13.2	55.7
MGA_1242	LOCUS_12400	sequence1:1243717..1245219(+)	frameshift,internal_stop_codon	1243495..1243497(+)	1243484	WP_010891905.1	LTA synthase family protein	99.6	76.0	61.7
MGA_1293	LOCUS_12910	sequence1:1299808..1302201(+)	partial			WP_003112847.1	phosphoethanolamine transferase CptA	42.7	55.5	29.4
MGA_1329	LOCUS_13270	sequence1:1343445..1344689(-)	partial			WP_003113036.1	GLUG motif-containing protein	49.3	20.3	26.8
MGA_1361	LOCUS_13590	sequence1:1376571..1377305(+)	partial			WP_015444193.1	amino acid adenylation domain-containing protein	88.9	16.5	32.0
MGA_1368	LOCUS_13660	sequence1:1382153..1382383(+)	partial			WP_010881114.1	acyl carrier protein	64.5	62.8	44.9
MGA_1371	LOCUS_13690	sequence1:1383627..1384199(+)	partial			WP_002856586.1	N-acetyltransferase LegH	98.9	70.7	50.5
MGA_1434	LOCUS_14320	sequence1:1443965..1444750(+)	partial			WP_010921944.1	ADP-ribosyltransferase	69.3	71.6	29.9
MGA_1449	LOCUS_14470	sequence1:1456385..1457005(-)	partial			WP_000892717.1	Sel1-like repeat protein HcpC	85.0	60.3	50.9
MGA_1512	LOCUS_15100	sequence1:1512798..1514939(-)	partial			WP_002788173.1	pentapeptide repeat-containing protein	45.9	73.5	27.7
MGA_1566	LOCUS_15640	sequence1:1579936..1580940(+)	partial			WP_002805290.1	flagellar basal body rod modification protein	37.1	42.2	58.9
MGA_1581	LOCUS_15790	sequence1:1598413..1601253(+)	partial			WP_011816940.1	filamentous hemagglutinin N-terminal domain-containing protein	15.1	6.5	34.5
MGA_1617	LOCUS_16150	sequence1:1639314..1640318(+)	frameshift		1640312,1640331	WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	97.6	45.3	40.7
MGA_1618	LOCUS_16160	sequence1:1640318..1641229(+)	frameshift		1640312,1640331	WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	96.4	40.7	33.7
