# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence1:1..8696(+)	partial			WP_004552911.1	trimeric autotransporter adhesin BpaB	17.8	49.4	30.3
MGA_13	LOCUS_00130	sequence1:22150..22551(-)	partial			WP_002799196.1	prepilin-type N-terminal cleavage/methylation domain-containing protein	65.4	55.6	35.8
MGA_38	LOCUS_00380	sequence1:50191..53268(-)	partial			WP_003113909.1	DUF748 domain-containing protein	40.7	40.3	28.6
MGA_47	LOCUS_00470	sequence1:62956..65367(-)	partial			WP_011787412.1	autotransporter domain-containing protein	29.6	33.1	26.6
MGA_50	LOCUS_00500	sequence1:67988..68767(+)	partial			WP_010919317.1	cystine ABC transporter substrate-binding protein	68.0	70.5	32.6
MGA_56	LOCUS_00560	sequence1:71940..72275(-)	partial			WP_010940947.1	cytochrome c3 family protein	95.5	17.3	43.0
MGA_63	LOCUS_00630	sequence1:78217..78783(-)	partial			WP_011120381.1	lipid-binding SYLF domain-containing protein	71.8	38.3	24.1
MGA_65	LOCUS_00650	sequence1:80278..80901(-)	partial			WP_164922815.1	5-formyltetrahydrofolate cyclo-ligase	53.1	59.4	25.8
MGA_89	LOCUS_00890	sequence1:102383..103009(+)	frameshift		103006	WP_002858733.1	diaminopimelate decarboxylase	100.0	51.7	70.7
MGA_90	LOCUS_00900	sequence1:103060..103566(+)	frameshift		103006	WP_002858733.1	diaminopimelate decarboxylase	100.0	38.6	52.4
MGA_113	LOCUS_01130	sequence1:126357..127640(+)	partial			WP_002858145.1	N-acetylmuramoyl-L-alanine amidase	61.6	38.2	56.4
MGA_136	LOCUS_01360	sequence1:148895..149089(-)	partial			WP_002852866.1	twin-arginine translocase TatA/TatE family subunit	92.2	69.6	62.7
MGA_137	LOCUS_01370	sequence1:149116..149307(-)	partial			WP_011014401.1	Sec-independent protein translocase subunit TatA	77.8	46.7	49.0
MGA_142	LOCUS_01420	sequence1:152701..154014(+)	partial			WP_008767132.1	endonuclease	41.0	62.4	26.5
MGA_155	LOCUS_01550	sequence1:170176..170904(-)	partial			WP_116269310.1	tetratricopeptide repeat protein	87.6	49.2	48.1
MGA_156	LOCUS_01560	sequence1:171015..171485(-)	partial			WP_116269310.1	tetratricopeptide repeat protein	89.7	32.5	49.3
MGA_168	LOCUS_01680	sequence1:187433..188605(+)	partial			WP_000880885.1	MotA/TolQ/ExbB proton channel family protein	61.5	41.1	23.6
MGA_186	LOCUS_01860	sequence1:202538..203671(+)	partial			WP_012061641.1	calcium-binding protein	26.0	49.3	38.9
MGA_188	LOCUS_01880	sequence1:204523..206121(+)	partial			WP_149323728.1	calcium-binding protein	21.2	8.4	39.7
MGA_190	LOCUS_01900	sequence1:207155..208543(+)	partial			WP_011038707.1	DUF2974 domain-containing protein	53.2	55.6	27.3
MGA_193	LOCUS_01930	sequence1:210267..213053(+)	partial			WP_158707352.1	calcium-binding protein	24.8	13.4	39.6
MGA_196	LOCUS_01960	sequence1:213943..214719(+)	frameshift		214680,214641,214635,214668	WP_003529018.1	calcium-binding protein	27.5	37.0	37.0
MGA_197	LOCUS_01970	sequence1:214719..216005(+)	frameshift		214668	WP_158707352.1	calcium-binding protein	47.4	11.6	35.9
MGA_202	LOCUS_02020	sequence1:218875..220731(+)	partial			WP_158707352.1	calcium-binding protein	27.7	9.7	43.0
MGA_214	LOCUS_02140	sequence1:232648..234315(-)	partial			WP_002865516.1	anaerobic C4-dicarboxylate transporter	51.5	59.9	67.5
MGA_218	LOCUS_02180	sequence1:237340..238131(-)	partial			WP_013227552.1	PhnD/SsuA/transferrin family substrate-binding protein	69.2	83.4	41.9
MGA_231	LOCUS_02310	sequence1:252633..253601(+)	partial			WP_002858001.1	acetyl-CoA carboxylase biotin carboxylase subunit	99.7	72.2	70.1
MGA_275	LOCUS_02750	sequence1:303416..305197(-)	partial			WP_007329982.1	Na/Pi cotransporter family protein	59.0	64.8	25.5
MGA_281	LOCUS_02810	sequence1:311384..312604(+)	frameshift		312598	WP_011109303.1	DUF262 domain-containing protein	37.2	26.3	37.4
MGA_282	LOCUS_02820	sequence1:312651..313454(-)	partial			WP_005798360.1	[FeFe] hydrogenase H-cluster maturation GTPase HydF	74.5	50.9	44.2
MGA_290	LOCUS_02900	sequence1:318936..319520(-)	partial			WP_005794135.1	aminotransferase class IV family protein	59.8	59.1	39.3
MGA_312	LOCUS_03120	sequence1:341470..341736(+)	partial			WP_000346779.1	site-specific DNA-methyltransferase	90.9	22.0	50.0
MGA_324	LOCUS_03240	sequence1:351345..352409(+)	partial			WP_002851370.1	membrane protein	27.7	49.2	33.7
MGA_326	LOCUS_03260	sequence1:352953..354710(+)	partial			WP_012583238.1	type II secretion system ATPase GspE	93.2	63.6	42.3
MGA_328	LOCUS_03280	sequence1:356120..358159(+)	partial			WP_010891893.1	DNA translocase FtsK	81.9	58.6	66.5
MGA_338	LOCUS_03380	sequence1:366637..367146(-)	partial			WP_001106543.1	DNA adenine methylase	98.2	50.5	65.1
MGA_343	LOCUS_03430	sequence1:369935..370294(+)	partial			WP_001235932.1	c-type cytochrome	67.2	60.2	41.2
MGA_357	LOCUS_03570	sequence1:382978..383661(+)	partial			WP_000367546.1	site-specific DNA-methyltransferase	65.6	20.7	42.8
MGA_371	LOCUS_03710	sequence1:399585..400061(-)	partial			WP_000694947.1	WG repeat-containing protein	87.3	43.2	36.7
MGA_412	LOCUS_04120	sequence1:448084..449061(+)	partial			WP_011922118.1	glycosyltransferase family 2 protein	67.4	65.6	36.5
MGA_439	LOCUS_04390	sequence1:479750..480442(-)	partial			WP_002852612.1	serine O-acetyltransferase	73.0	79.7	65.1
MGA_451	LOCUS_04510	sequence1:490902..492098(-)	partial			WP_010891827.1	PD-(D/E)XK nuclease family protein	62.8	61.3	31.3
MGA_473	LOCUS_04730	sequence1:513890..514303(+)	partial			WP_011460328.1	Rrf2 family transcriptional regulator	62.0	58.2	45.9
MGA_483	LOCUS_04830	sequence1:522826..524397(+)	internal_stop_codon	522778..522780(+)		WP_019084281.1	TonB-dependent receptor	99.0	54.5	25.7
MGA_491	LOCUS_04910	sequence1:532296..535670(-)	partial			WP_002826528.1	carbamoyltransferase HypF	47.5	68.6	35.9
MGA_540	LOCUS_05400	sequence1:587615..587989(+)	partial			WP_002852050.1	hypothetical protein	71.0	28.2	43.2
MGA_541	LOCUS_05410	sequence1:587992..588828(+)	internal_stop_codon	588826..588828(+)		WP_011166554.1	DNA recombination protein RmuC	93.9	80.6	30.7
MGA_546	LOCUS_05460	sequence1:595175..595555(-)	partial			WP_002858588.1	ATP-dependent DNA helicase RecG	91.3	19.3	70.1
MGA_553	LOCUS_05530	sequence1:603369..607883(+)	partial			WP_011035898.1	ESPR-type extended signal peptide-containing protein	96.9	60.7	25.1
MGA_555	LOCUS_05550	sequence1:609120..610676(+)	partial			WP_003230755.1	dynamin GTPase	94.2	40.0	22.2
MGA_583	LOCUS_05830	sequence1:639929..640954(+)	partial			WP_002858054.1	UDP-N-acetylglucosamine 4,6-dehydratase (configuration-retaining)	98.2	56.6	62.8
MGA_587	LOCUS_05870	sequence1:642803..643270(+)	partial			WP_002858681.1	serine--tRNA ligase	95.5	35.0	50.0
MGA_597	LOCUS_05970	sequence1:651858..652670(-)	partial			WP_000826792.1	two-component system sensor histidine kinase HprS	88.5	54.4	27.8
MGA_602	LOCUS_06020	sequence1:655040..655453(+)	internal_stop_codon	655451..655453(+)		WP_002858662.1	anthranilate phosphoribosyltransferase	95.6	24.6	53.4
MGA_603	LOCUS_06030	sequence1:655619..656050(+)	internal_stop_codon	655451..655453(+)		WP_002858662.1	anthranilate phosphoribosyltransferase	97.9	26.3	57.1
MGA_607	LOCUS_06070	sequence1:668067..668750(-)	partial			WP_000901420.1	Sel1-like repeat protein HcpA	56.4	50.0	40.6
MGA_637	LOCUS_06370	sequence1:695469..695903(-)	partial			WP_010951099.1	DNA methyltransferase	85.4	16.0	37.6
MGA_639	LOCUS_06390	sequence1:696844..698160(-)	partial			WP_011707115.1	sodium/pantothenate symporter	73.5	70.3	25.1
MGA_676	LOCUS_06760	sequence1:733755..734438(-)	partial			WP_015944691.1	polysaccharide deacetylase family protein	94.7	63.6	34.6
MGA_680	LOCUS_06800	sequence1:737554..738369(-)	partial			WP_011017010.1	polysaccharide deacetylase family protein	84.5	64.2	36.9
MGA_688	LOCUS_06880	sequence1:746477..746686(-)	partial			WP_002853349.1	ribonuclease P protein component	100.0	63.9	43.5
MGA_689	LOCUS_06890	sequence1:746800..746934(-)	partial			WP_002776864.1	50S ribosomal protein L34	72.7	72.7	84.4
MGA_694	LOCUS_06940	sequence1:752015..752395(-)	partial			WP_012545648.1	response regulator	90.5	31.6	41.2
MGA_695	LOCUS_06950	sequence1:752400..756557(-)	partial			WP_011071149.1	PAS domain S-box protein	27.0	21.6	34.7
MGA_700	LOCUS_07000	sequence1:761155..762252(+)	partial			WP_209021411.1	Dam family site-specific DNA-(adenine-N6)-methyltransferase	94.2	47.2	89.8
MGA_703	LOCUS_07030	sequence1:763278..763931(+)	frameshift		763925	WP_027348389.1	AlwI family type II restriction endonuclease	95.9	31.5	69.7
MGA_704	LOCUS_07040	sequence1:763909..764649(+)	frameshift		763925,764646	WP_027348389.1	AlwI family type II restriction endonuclease	98.8	36.8	81.5
MGA_705	LOCUS_07050	sequence1:764613..765149(+)	frameshift		764646	WP_027348389.1	AlwI family type II restriction endonuclease	96.6	25.8	79.7
MGA_710	LOCUS_07100	sequence1:772074..772550(+)	partial			WP_002853189.1	glutamine-hydrolyzing GMP synthase	100.0	30.9	84.2
MGA_711	LOCUS_07110	sequence1:773855..774994(+)	partial			WP_140834638.1	CapA family protein	85.5	72.1	36.0
MGA_734	LOCUS_07340	sequence1:796532..798178(+)	partial			WP_158707352.1	calcium-binding protein	25.2	7.7	44.6
MGA_737	LOCUS_07370	sequence1:799313..800713(+)	partial			WP_158707352.1	calcium-binding protein	34.5	9.1	41.7
MGA_817	LOCUS_08170	sequence1:874755..875849(-)	partial			WP_010941913.1	nitrous oxide reductase accessory protein NosL	36.5	84.4	48.9
MGA_865	LOCUS_08650	sequence1:928008..929057(-)	frameshift		928034,928031	WP_003594382.1	excinuclease ABC subunit UvrA	97.7	46.2	28.7
MGA_868	LOCUS_08680	sequence1:934344..935057(+)	partial			WP_000764034.1	hypothetical protein	85.2	72.9	38.6
MGA_886	LOCUS_08860	sequence1:951252..951833(-)	frameshift		951924	WP_002856709.1	amino acid ABC transporter permease	100.0	77.7	66.3
MGA_921	LOCUS_09200	sequence1:986502..986909(+)	frameshift,internal_stop_codon	986907..986909(+)	986936	WP_010880190.1	type I-B CRISPR-associated endonuclease Cas1b	81.5	35.8	46.9
MGA_922	LOCUS_09210	sequence1:986927..987502(+)	frameshift		986873	WP_008768967.1	type I-B CRISPR-associated endonuclease Cas1b	97.4	54.6	43.0
MGA_927	LOCUS_09240	sequence1:993093..993407(-)	frameshift		993528	WP_003751157.1	phage terminase large subunit	74.0	14.4	41.8
MGA_969	LOCUS_09660	sequence1:1037967..1038134(-)	partial			WP_002858758.1	threonine ammonia-lyase	100.0	13.6	56.4
MGA_980	LOCUS_09770	sequence1:1047327..1047563(-)	frameshift		1047601,1047331	WP_012775600.1	nucleotidyl transferase AbiEii/AbiGii toxin family protein	94.9	26.3	50.0
MGA_981	LOCUS_09780	sequence1:1047593..1047922(-)	frameshift		1047601	WP_011166377.1	nucleotidyl transferase AbiEii/AbiGii toxin family protein	97.2	42.3	29.7
MGA_982	LOCUS_09790	sequence1:1047919..1048251(-)	frameshift		1048252	WP_020862546.1	type IV toxin-antitoxin system AbiEi family antitoxin domain-containing protein	96.4	52.0	33.0
MGA_1000	LOCUS_09970	sequence1:1063186..1070214(-)	partial			WP_201627199.1	autotransporter-associated N-terminal domain-containing protein	73.7	70.8	25.7
MGA_1019	LOCUS_10160	sequence1:1085661..1086560(-)	partial			WP_010989855.1	DNA polymerase IV	68.6	58.7	31.0
MGA_1023	LOCUS_10200	sequence1:1087623..1089677(-)	partial			WP_019561992.1	phage tail protein	38.5	35.3	26.5
MGA_1030	LOCUS_10270	sequence1:1095010..1096602(-)	partial			WP_011104844.1	phage tail tape measure protein	59.1	25.8	34.9
MGA_1046	LOCUS_10430	sequence1:1105642..1106862(+)	partial			WP_000117561.1	phage minor head protein	45.3	68.5	40.6
MGA_1068	LOCUS_10650	sequence1:1120664..1121284(-)	partial			WP_002865738.1	single-stranded DNA-binding protein	51.0	57.4	80.0
MGA_1083	LOCUS_10800	sequence1:1136874..1137386(+)	frameshift		1137380	WP_002851930.1	lipid A/FlgG phosphoethanolamine transferase EptC	97.6	32.6	43.5
MGA_1084	LOCUS_10810	sequence1:1137391..1138167(+)	frameshift		1137380	WP_002851930.1	lipid A/FlgG phosphoethanolamine transferase EptC	99.2	49.4	49.6
MGA_1131	LOCUS_11280	sequence1:1182170..1183855(+)	partial			WP_001096399.1	VirB3 family type IV secretion system protein	92.9	57.5	40.3
MGA_1137	LOCUS_11340	sequence1:1187467..1188678(+)	partial			WP_011264002.1	type IV secretion system protein VirB10	47.6	47.0	45.6
MGA_1150	LOCUS_11470	sequence1:1200294..1206647(+)	partial			WP_011860792.1	DEAD/DEAH box helicase family protein	71.2	49.7	30.9
MGA_1167	LOCUS_11640	sequence1:1217472..1219298(-)	partial			WP_000323332.1	hypothetical protein	48.0	56.6	33.9
MGA_1171	LOCUS_11680	sequence1:1220591..1221007(-)	partial			WP_009874495.1	single-stranded DNA-binding protein	68.1	55.0	50.5
MGA_1175	LOCUS_11720	sequence1:1224794..1225951(+)	partial			WP_011476486.1	site-specific integrase	74.8	80.8	26.2
MGA_1198	LOCUS_11950	sequence1:1250009..1250842(+)	partial			WP_012048382.1	peptidylprolyl isomerase	73.3	70.2	26.9
MGA_1219	LOCUS_12160	sequence1:1262091..1262420(-)	partial			WP_002851214.1	50S ribosomal protein L22	95.4	73.8	81.7
MGA_1231	LOCUS_12280	sequence1:1273787..1274287(-)	partial			WP_012582849.1	hypothetical protein	97.6	69.3	29.2
MGA_1239	LOCUS_12360	sequence1:1280647..1281741(+)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	80.2	73.0	39.6
MGA_1240	LOCUS_12370	sequence1:1281752..1282807(+)	partial			WP_196835716.1	adenine-specific methyltransferase EcoRI family protein	88.6	72.3	42.4
MGA_1241	LOCUS_12380	sequence1:1282810..1283901(+)	partial			WP_025163903.1	DUF262 domain-containing protein	38.8	40.9	27.4
MGA_1243	LOCUS_12400	sequence1:1289996..1290265(-)	frameshift		1290010,1289958	WP_003691751.1	very short patch repair endonuclease	93.3	59.3	54.8
MGA_1244	LOCUS_12410	sequence1:1290262..1290726(-)	frameshift,internal_stop_codon	1290743..1290745(-)	1290736	WP_011964363.1	HpaII family restriction endonuclease	100.0	44.0	51.6
MGA_1245	LOCUS_12420	sequence1:1290743..1291165(-)	frameshift,internal_stop_codon	1290739..1290741(-)	1290745	WP_011964363.1	HpaII family restriction endonuclease	67.9	26.1	48.4
MGA_1247	LOCUS_12440	sequence1:1292078..1292344(-)	partial			WP_011964247.1	DNA cytosine methyltransferase	97.7	25.4	62.8
MGA_1255	LOCUS_12520	sequence1:1300035..1300400(-)	frameshift		1300386	WP_002858699.1	YajQ family cyclic di-GMP-binding protein	93.4	68.1	58.4
MGA_1256	LOCUS_12530	sequence1:1300360..1300533(-)	frameshift		1300386	WP_002858699.1	YajQ family cyclic di-GMP-binding protein	84.2	29.4	64.6
MGA_1267	LOCUS_12640	sequence1:1309523..1310497(+)	partial			WP_010891843.1	putative transporter	83.6	70.6	59.4
MGA_1269	LOCUS_12660	sequence1:1311043..1311684(+)	partial			WP_002853271.1	AEC family transporter	95.8	67.7	54.1
MGA_1286	LOCUS_12830	sequence1:1326654..1328447(-)	partial			WP_000273909.1	AAA family ATPase	29.0	33.0	24.8
MGA_1296	LOCUS_12930	sequence1:1337111..1338502(-)	partial			WP_011070793.1	cyclic di-GMP phosphodiesterase PdeB	84.0	48.0	24.2
MGA_1303	LOCUS_13000	sequence1:1345278..1345652(-)	partial			WP_003140884.1	TM2 domain-containing protein	50.0	48.6	48.4
MGA_1319	LOCUS_13160	sequence1:1360008..1360880(-)	partial			WP_002853219.1	two-component system sensor histidine kinase DccS	81.7	58.8	31.4
MGA_1323	LOCUS_13200	sequence1:1363107..1364147(-)	frameshift		1364149	WP_000028230.1	thiosulfate reductase PhsA	98.6	44.7	38.1
MGA_1324	LOCUS_13210	sequence1:1364147..1365382(-)	frameshift		1364200,1364148	WP_011073774.1	thiosulfate reductase PhsA	95.9	52.5	45.1
MGA_1335	LOCUS_13320	sequence1:1377552..1377806(-)	partial			WP_001121932.1	KpsF/GutQ family sugar-phosphate isomerase	97.6	24.6	40.2
MGA_1336	LOCUS_13330	sequence1:1378043..1378621(-)	frameshift		1378738,1378719	WP_002852272.1	class II fructose-bisphosphate aldolase	91.1	49.4	76.0
MGA_1351	LOCUS_13480	sequence1:1393960..1394907(+)	partial			WP_008761173.1	DUF3137 domain-containing protein	63.2	60.3	29.1
MGA_1358	LOCUS_13550	sequence1:1403054..1403827(+)	partial			WP_011837081.1	ABC transporter substrate-binding protein/permease	91.1	30.2	27.5
MGA_1374	LOCUS_13710	sequence1:1427983..1428546(-)	partial			WP_002853050.1	c-type cytochrome	62.0	79.9	31.6
MGA_1391	LOCUS_13880	sequence1:1441115..1442293(-)	partial			WP_010943428.1	cytochrome c family protein	64.3	51.4	25.7
MGA_1450	LOCUS_14470	sequence1:1506546..1506893(-)	partial			WP_000345576.1	protein-disulfide oxidoreductase DsbI	86.1	44.4	38.6
MGA_1464	LOCUS_14610	sequence1:1519284..1520930(+)	partial			WP_002851181.1	DNA primase	81.0	73.7	47.9
MGA_1506	LOCUS_15030	sequence1:1556101..1557165(+)	partial			WP_013095459.1	phosphatidylglycerol--membrane-oligosaccharide glycerophosphotransferase	86.4	40.4	34.2
MGA_1522	LOCUS_15190	sequence1:1573668..1573883(-)	frameshift		1573676	WP_000796568.1	heavy metal translocating P-type ATPase	90.1	8.1	51.6
MGA_1527	LOCUS_15240	sequence1:1580956..1588305(+)	partial			WP_014206787.1	hemagglutinin repeat-containing protein	14.9	8.1	33.2
MGA_1531	LOCUS_15280	sequence1:1590030..1591304(+)	partial			WP_210043352.1	deaminase domain-containing protein	60.8	5.3	34.3
MGA_1563	LOCUS_15600	sequence1:1616686..1618167(-)	partial			WP_002673213.1	membrane protein	48.9	70.0	22.6
MGA_1587	LOCUS_15840	sequence1:1641802..1642947(+)	partial			WP_012583970.1	glycosyltransferase family 4 protein	52.2	52.7	26.3
MGA_1589	LOCUS_15860	sequence1:1643803..1644249(+)	partial			WP_000703236.1	glycosyltransferase family 4 protein	98.0	38.5	56.6
MGA_1596	LOCUS_15930	sequence1:1648842..1649540(-)	partial			WP_010622329.1	Rha family transcriptional regulator	73.7	69.1	37.2
MGA_1613	LOCUS_16100	sequence1:1665084..1666571(+)	partial			WP_010895998.1	penicillin-binding protein 1B	82.8	64.1	28.6
MGA_1616	LOCUS_16130	sequence1:1669625..1676362(-)	partial			WP_010980934.1	iron-regulated protein FrpC	33.2	43.7	30.6
MGA_1617	LOCUS_16140	sequence1:1676559..1679951(-)	partial			WP_158707352.1	calcium-binding protein	35.0	19.5	30.4
MGA_1619	LOCUS_16160	sequence1:1680954..1682987(-)	partial			WP_149323728.1	calcium-binding protein	16.7	8.4	39.7
MGA_1624	LOCUS_16210	sequence1:1685873..1686835(-)	partial			WP_010980934.1	iron-regulated protein FrpC	33.4	5.7	40.4
MGA_1639	LOCUS_16360	sequence1:1703068..1703895(+)	internal_stop_codon	1703893..1703895(+)		WP_015064796.1	virulence RhuM family protein	99.3	77.9	52.5
MGA_1647	LOCUS_16440	sequence1:1707112..1707621(+)	partial			WP_011336918.1	terminase large subunit	83.4	25.0	33.3
