# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_1	LOCUS_00010	sequence1:81..305(-)	frameshift		312,415,75,397,111	WP_010948443.1	lpg2745 family Dot/Icm T4SS effector	90.5	10.2	95.5
MGA_2	LOCUS_00020	sequence1:305..508(-)	frameshift		414,311,74,396,669,110	WP_010948443.1	lpg2745 family Dot/Icm T4SS effector	100.0	10.2	91.0
MGA_3	LOCUS_00030	sequence1:908..1195(-)	frameshift		1296,848,829,667,909	WP_010948443.1	lpg2745 family Dot/Icm T4SS effector	100.0	14.5	98.9
MGA_7	LOCUS_00060	sequence1:7860..8240(-)	frameshift		8272	WP_010946060.1	4-hydroxythreonine-4-phosphate dehydrogenase PdxA	100.0	38.9	99.2
MGA_8	LOCUS_00070	sequence1:8228..8560(-)	frameshift		8649,8271	WP_010946060.1	4-hydroxythreonine-4-phosphate dehydrogenase PdxA	87.3	29.6	100.0
MGA_9	LOCUS_00080	sequence1:8632..8832(-)	frameshift		8649	WP_010946060.1	4-hydroxythreonine-4-phosphate dehydrogenase PdxA	95.5	19.4	100.0
MGA_10	LOCUS_00090	sequence1:9098..9319(-)	frameshift		9105,9027,8883,9012,9351	WP_015444876.1	peptidylprolyl isomerase	95.9	16.3	98.6
MGA_11	LOCUS_00100	sequence1:9340..9603(-)	frameshift		9840,9747,9620,9349,9351,9695,9103	WP_015444876.1	peptidylprolyl isomerase	96.6	19.6	79.8
MGA_12	LOCUS_00110	sequence1:9817..9945(-)	frameshift,internal_stop_codon	9955..9957(-)	9840,10049,9747,9620,9994,9695	WP_015444876.1	peptidylprolyl isomerase	83.3	8.2	100.0
MGA_13	LOCUS_00120	sequence1:10429..10674(-)	frameshift,internal_stop_codon	10816..10818(-)	10950,10439,10665,10794,10412,10704,10935,10394	WP_016356722.1	LPS-assembly protein LptD	92.6	8.9	100.0
MGA_14	LOCUS_00130	sequence1:10985..11248(-)	frameshift,internal_stop_codon	10810..10812(-)	10944,10788,11367,11241,10698,11307,11469,10929,10971,11007	WP_016356722.1	LPS-assembly protein LptD	88.5	9.2	100.0
MGA_15	LOCUS_00140	sequence1:11596..12009(-)	frameshift		11363,11636,11303,11654,11591,12104,11465	WP_016356722.1	LPS-assembly protein LptD	86.1	14.1	100.0
MGA_16	LOCUS_00150	sequence1:12048..12479(-)	frameshift		12698,12101,12485,12638	WP_016356722.1	LPS-assembly protein LptD	87.4	14.9	99.2
MGA_18	LOCUS_00170	sequence1:14646..15092(-)	frameshift		14728,15118	WP_010946055.1	lpg0294 family Dot/Icm T4SS effector	82.4	53.0	98.4
MGA_19	LOCUS_00180	sequence1:15068..15376(-)	frameshift		15118	WP_010946055.1	lpg0294 family Dot/Icm T4SS effector	89.2	39.6	96.7
MGA_20	LOCUS_00190	sequence1:15490..15705(-)	frameshift		15704	WP_010946054.1	acyl-CoA dehydrogenase	100.0	8.7	88.7
MGA_54	LOCUS_00530	sequence1:57094..57279(+)	internal_stop_codon	57061..57063(+)		WP_010946237.1	GIY-YIG nuclease family protein	100.0	63.5	98.4
MGA_126	LOCUS_01250	sequence1:149642..150214(+)	partial			WP_010945947.1	ABC transporter permease	100.0	60.7	97.9
MGA_168	LOCUS_01670	sequence1:188516..188809(+)	frameshift		188779	WP_102990622.1	IS3 family transposase	90.7	22.5	92.0
MGA_169	LOCUS_01680	sequence1:188869..189690(+)	frameshift		188779	WP_102990622.1	IS3 family transposase	100.0	69.8	99.3
MGA_253	LOCUS_02520	sequence1:298758..299039(-)	partial			WP_010946820.1	tyrosine-type recombinase/integrase	94.6	21.3	69.3
MGA_276	LOCUS_02750	sequence1:319346..319702(-)	partial			WP_025862422.1	transporter suffix domain-containing protein	100.0	73.8	100.0
MGA_298	LOCUS_02970	sequence1:344717..345274(-)	partial			WP_014840688.1	hypothetical protein	100.0	59.7	100.0
MGA_311	LOCUS_03100	sequence1:362153..362821(-)	partial			WP_010945765.1	DNA replication/repair protein RecF	100.0	62.9	99.5
MGA_371	LOCUS_03700	sequence1:429734..430204(+)	partial			WP_011390771.1	lasso peptide biosynthesis B2 protein	34.6	36.2	41.8
MGA_390	LOCUS_03890	sequence1:448498..448797(-)	partial			WP_010948615.1	twin-arginine translocase subunit TatC	100.0	41.1	100.0
MGA_417	LOCUS_04160	sequence1:476406..476591(-)	partial			WP_003095893.1	twin-arginine translocase TatA/TatE family subunit	70.5	50.0	58.1
MGA_472	LOCUS_04710	sequence1:533433..534359(+)	partial			WP_010948541.1	tetratricopeptide repeat protein	40.9	40.9	100.0
MGA_482	LOCUS_04810	sequence1:545334..546407(+)	partial			WP_010948531.1	lpg2844 family Dot/Icm T4SS effector	40.1	39.6	89.5
MGA_568	LOCUS_05670	sequence1:656217..657608(-)	partial			WP_010948448.1	sulfatase-like hydrolase/transferase	100.0	69.6	100.0
MGA_604	LOCUS_06010	sequence1:696742..696954(-)	partial			WP_010948415.1	DUF167 domain-containing protein	100.0	73.7	100.0
MGA_606	LOCUS_06030	sequence1:699630..700019(+)	partial			WP_011216580.1	translation initiation factor IF-3	100.0	72.5	96.9
MGA_607	LOCUS_06040	sequence1:700040..700240(+)	partial			WP_005596065.1	50S ribosomal protein L35	68.2	69.2	68.9
MGA_631	LOCUS_06280	sequence1:724252..725076(+)	partial			WP_010948390.1	protein LphB	100.0	49.7	86.9
MGA_634	LOCUS_06310	sequence1:727219..727524(+)	partial			WP_010948387.1	type IVB secretion system protein IcmV	100.0	66.9	89.1
MGA_675	LOCUS_06720	sequence1:770743..770979(+)	frameshift		770949	WP_011216518.1	UvrY/SirA/GacA family response regulator transcription factor	98.7	35.2	93.5
MGA_676	LOCUS_06730	sequence1:770928..771401(+)	frameshift		770949	WP_011216518.1	UvrY/SirA/GacA family response regulator transcription factor	95.5	68.5	100.0
MGA_755	LOCUS_07520	sequence1:865713..866558(-)	frameshift		866566	WP_223804314.1	IS3-like element ISLpn8 family transposase	100.0	76.2	99.6
MGA_756	LOCUS_07530	sequence1:866555..866821(-)	frameshift		866566	WP_223804314.1	IS3-like element ISLpn8 family transposase	98.9	23.6	98.9
MGA_763	LOCUS_07600	sequence1:872309..872737(-)	partial			WP_025385041.1	site-specific integrase	100.0	34.3	78.9
MGA_879	LOCUS_08760	sequence1:1004168..1004605(+)	partial			WP_198265214.1	IS5 family transposase	92.4	56.8	73.1
MGA_880	LOCUS_08770	sequence1:1004635..1004820(+)	partial			WP_010946237.1	GIY-YIG nuclease family protein	100.0	63.5	96.7
MGA_949	LOCUS_09460	sequence1:1080702..1081280(-)	frameshift		1081287	WP_058498129.1	lpg2370 family Dot/Icm T4SS effector	100.0	61.9	90.7
MGA_950	LOCUS_09470	sequence1:1081270..1081620(-)	frameshift		1081287	WP_027224428.1	HipA domain-containing protein	95.7	35.8	97.3
MGA_951	LOCUS_09480	sequence1:1081617..1081784(-)	frameshift		1081755	WP_010948073.1	HipA N-terminal domain-containing protein	90.9	49.0	96.0
MGA_959	LOCUS_09560	sequence1:1085286..1085951(+)	partial			WP_014844527.1	hypothetical protein	48.0	32.3	62.3
MGA_1130	LOCUS_11260	sequence1:1276032..1276304(-)	partial			WP_010947914.1	hypothetical protein	100.0	42.5	94.4
MGA_1133	LOCUS_11290	sequence1:1280059..1280391(+)	partial			WP_162839581.1	archease	100.0	74.8	100.0
MGA_1137	LOCUS_11330	sequence1:1283327..1284031(-)	partial			WP_015444184.1	oligopeptide:H+ symporter	100.0	46.8	96.2
MGA_1284	LOCUS_12790	sequence1:1473269..1473568(-)	partial			WP_010947765.1	hypothetical protein	56.6	56.6	100.0
MGA_1326	LOCUS_13210	sequence1:1514821..1515024(+)	partial			WP_002116990.1	DNA-directed RNA polymerase subunit omega	98.5	71.7	72.7
MGA_1364	LOCUS_13590	sequence1:1551832..1552077(+)	frameshift,internal_stop_codon	1551797..1551799(+)	1551826	WP_040534536.1	IS5 family transposase	60.5	19.7	65.3
MGA_1438	LOCUS_14330	sequence1:1644464..1645627(-)	partial			WP_010947617.1	DUF3488 and transglutaminase-like domain-containing protein	100.0	58.5	100.0
MGA_1752	LOCUS_17470	sequence1:2021210..2021401(+)	partial			WP_005768810.1	succinate dehydrogenase assembly factor 2	77.8	59.8	46.9
MGA_1981	LOCUS_19760	sequence1:2276174..2276980(+)	partial			WP_010947079.1	apolipoprotein N-acyltransferase	100.0	52.4	97.4
MGA_2007	LOCUS_20010	sequence1:2306103..2306918(+)	partial			WP_010947054.1	legiobactin import MFS transporter LbtC	100.0	70.2	93.7
MGA_2064	LOCUS_20580	sequence1:2369609..2370220(-)	partial			WP_010655106.1	HD domain-containing protein	99.5	64.5	63.0
MGA_2070	LOCUS_20640	sequence1:2373663..2374715(+)	partial			WP_010946996.1	oligopeptide:H+ symporter	100.0	70.7	97.1
MGA_2133	LOCUS_21270	sequence1:2435677..2435973(+)	partial			WP_011036977.1	YerC/YecD family TrpR-related protein	80.6	73.1	55.7
MGA_2190	LOCUS_21840	sequence1:2505862..2506335(+)	partial			WP_010946878.1	Dot/Icm T4SS effector CegC3	68.8	64.3	94.4
MGA_2247	LOCUS_22410	sequence1:2576350..2576739(-)	partial			WP_010946824.1	hypothetical protein	100.0	74.6	100.0
MGA_2265	LOCUS_22590	sequence1:2597441..2597716(+)	partial			WP_010945905.1	ISL3 family transposase	100.0	23.3	100.0
MGA_2300	LOCUS_22940	sequence1:2626339..2626506(+)	partial			WP_072363891.1	CHASE3 domain-containing protein	100.0	69.6	98.2
MGA_2322	LOCUS_23160	sequence1:2655475..2655708(-)	frameshift		2655576	WP_058460933.1	cation-translocating P-type ATPase	70.1	6.0	77.8
MGA_2326	LOCUS_23200	sequence1:2657666..2658196(-)	internal_stop_codon	2658290..2658292(-)		WP_010655421.1	SDR family oxidoreductase	100.0	66.4	98.3
MGA_2327	LOCUS_23210	sequence1:2658290..2658463(-)	internal_stop_codon	2658290..2658292(-)		WP_115222831.1	SDR family oxidoreductase	100.0	21.5	96.5
MGA_2338	LOCUS_23320	sequence1:2670846..2671100(-)	partial			WP_045096252.1	XRE family transcriptional regulator	88.1	33.0	48.0
MGA_2377	LOCUS_23710	sequence1:2705202..2706605(-)	partial			WP_010946701.1	nucleoside-diphosphate sugar epimerase/dehydratase	100.0	74.7	98.1
MGA_2378	LOCUS_23720	sequence1:2707134..2707922(-)	partial			WP_032828678.1	hypothetical protein	100.0	52.2	98.5
MGA_2547	LOCUS_25410	sequence1:2894843..2895451(-)	frameshift		2895485	WP_223804314.1	IS3-like element ISLpn8 family transposase	79.7	43.6	91.3
MGA_2548	LOCUS_25420	sequence1:2895465..2895788(-)	frameshift		2895490,2895814	WP_223804314.1	IS3-like element ISLpn8 family transposase	94.4	27.4	89.1
MGA_2549	LOCUS_25430	sequence1:2895809..2896075(-)	frameshift		2895814	WP_223804314.1	IS3-like element ISLpn8 family transposase	98.9	23.6	90.8
MGA_2554	LOCUS_25480	sequence1:2901432..2901860(-)	partial			WP_011213316.1	DUF1574 family protein	100.0	36.6	100.0
MGA_2561	LOCUS_25550	sequence1:2908627..2910027(+)	partial			WP_010946519.1	acyltransferase family protein	100.0	70.6	99.1
MGA_2697	LOCUS_26910	sequence1:3072392..3076681(-)	frameshift		3076722	WP_070065546.1	enhanced entry virulence factor RtxA	100.0	22.3	95.7
MGA_2698	LOCUS_26920	sequence1:3076678..3080280(-)	frameshift		3080266,3076722	WP_070065546.1	enhanced entry virulence factor RtxA	98.4	18.4	90.5
MGA_2699	LOCUS_26930	sequence1:3080210..3080620(-)	frameshift		3080640,3080265,3080268,3080637	WP_070065546.1	enhanced entry virulence factor RtxA	86.8	1.8	82.2
MGA_2700	LOCUS_26940	sequence1:3080635..3087894(-)	frameshift		3080640,3080643,3080637	WP_070065546.1	enhanced entry virulence factor RtxA	100.0	37.7	92.2
MGA_2723	LOCUS_27170	sequence1:3115460..3116056(+)	partial			WP_010946359.1	membrane protein	100.0	30.6	100.0
MGA_2786	LOCUS_27790	sequence1:3179177..3179677(+)	partial			WP_015444791.1	lysophospholipid acyltransferase family protein	100.0	68.3	100.0
MGA_2828	LOCUS_28210	sequence1:3225690..3226253(-)	partial			WP_015444807.1	phosphatidate cytidylyltransferase	100.0	70.6	99.5
MGA_2845	LOCUS_28380	sequence1:3243136..3243570(-)	partial			WP_198265214.1	IS5 family transposase	98.6	60.2	73.9
MGA_2891	LOCUS_28840	sequence1:3293494..3294270(+)	partial			WP_010946188.1	Dot/Icm T4SS effector Ceg15	100.0	73.9	100.0
MGA_3025	LOCUS_30160	sequence1:3424747..3425193(+)	frameshift		3425160	WP_010946051.1	patatin-like phospholipase family protein	93.2	34.4	94.2
MGA_3026	LOCUS_30170	sequence1:3425160..3425951(+)	frameshift		3425154	WP_010946051.1	patatin-like phospholipase family protein	100.0	65.6	99.6
MGA_3027	LOCUS_30180	sequence1:3425992..3426417(+)	frameshift		3426609,3426627,3426309	WP_015444881.1	polyphosphate kinase 1	83.0	17.0	93.2
MGA_3028	LOCUS_30190	sequence1:3426315..3426908(+)	frameshift		3426609,3426627,3426309,3427063,3427195,3427117,3426814	WP_015444881.1	polyphosphate kinase 1	87.8	25.1	93.1
MGA_3029	LOCUS_30200	sequence1:3426809..3427135(+)	frameshift		3427392,3426626,3427266,3427116,3426608,3427062,3427194,3426813	WP_015444881.1	polyphosphate kinase 1	77.8	12.2	98.8
MGA_3030	LOCUS_30210	sequence1:3427719..3427928(+)	frameshift		3427936,3427906,3427430,3427750,3427529,3427786,3427499,3427472,3427665,3427924	WP_015444881.1	polyphosphate kinase 1	66.7	6.8	78.7
MGA_3032	LOCUS_30220	sequence2:238..771(+)	frameshift		392,203,908,911,404,410,59,731	WP_070065546.1	enhanced entry virulence factor RtxA	92.1	2.6	92.1
MGA_3033	LOCUS_30230	sequence2:768..908(+)	frameshift,internal_stop_codon	1108..1110(+)	726,903,906,1086	WP_070065546.1	enhanced entry virulence factor RtxA	67.4	0.5	96.8
MGA_3036	LOCUS_30260	sequence2:1365..1643(+)	frameshift,internal_stop_codon	1106..1108(+)	1605,1366,1606,1365,1725,1726,1087	WP_070065546.1	enhanced entry virulence factor RtxA	87.0	1.2	81.2
MGA_3037	LOCUS_30270	sequence2:1738..2298(+)	frameshift		1604,2297,1724	WP_070065546.1	enhanced entry virulence factor RtxA	100.0	2.9	93.5
MGA_3038	LOCUS_30280	sequence2:2295..17402(+)	frameshift		2295	WP_070065546.1	enhanced entry virulence factor RtxA	100.0	78.4	91.5
MGA_3039	LOCUS_30290	sequence2:17581..18024(+)	frameshift		17856,18100	WP_010946383.1	NAD(P)H:quinone oxidoreductase	62.6	46.2	100.0
MGA_3040	LOCUS_30300	sequence2:17936..18118(+)	frameshift		17853,18103	WP_010946383.1	NAD(P)H:quinone oxidoreductase	95.0	28.6	98.2
MGA_3041	LOCUS_30310	sequence2:18297..18515(+)	frameshift		18561,18494	WP_010947893.1	IS4-like element ISLpn6 family transposase	91.7	14.1	100.0
MGA_3043	LOCUS_30330	sequence2:18687..19130(+)	frameshift		18561,19050,19398,18494	WP_010946384.1	IS4-like element ISLpn6 family transposase	87.1	27.4	94.5
MGA_3044	LOCUS_30340	sequence2:19157..19462(+)	frameshift		19049,19397	WP_010946384.1	IS4-like element ISLpn6 family transposase	81.2	17.5	97.6
MGA_3045	LOCUS_30350	sequence2:19440..19703(+)	frameshift		19396	WP_010946384.1	IS4-like element ISLpn6 family transposase	100.0	18.6	94.3
MGA_3050	LOCUS_30390	sequence3:3961..4782(-)	frameshift		4871	WP_102990622.1	IS3 family transposase	100.0	69.8	99.3
MGA_3051	LOCUS_30400	sequence3:4842..5135(-)	frameshift		4871	WP_102990622.1	IS3 family transposase	90.7	22.5	92.0
MGA_3053	LOCUS_30420	sequence3:5617..5817(+)	frameshift		6042,5814	WP_010945909.1	hypothetical protein	100.0	14.5	100.0
MGA_3054	LOCUS_30430	sequence3:5865..6086(+)	frameshift		6042,5814	WP_010945909.1	hypothetical protein	80.8	12.9	100.0
MGA_3055	LOCUS_30440	sequence3:6077..6985(+)	frameshift		6042,5814	WP_010945909.1	hypothetical protein	100.0	66.2	99.7
MGA_3056	LOCUS_30450	sequence3:7117..7878(-)	frameshift		7927,7928,7930,8044,8047	WP_010945910.1	hypothetical protein	100.0	56.7	98.4
MGA_3057	LOCUS_30460	sequence3:8572..8844(-)	frameshift		8552,8810,8949,8591	WP_010945911.1	P-loop NTPase fold protein	81.1	16.0	100.0
MGA_3058	LOCUS_30470	sequence3:8905..9840(-)	frameshift		8810,8949	WP_010945911.1	P-loop NTPase fold protein	95.5	65.1	98.3
MGA_3059	LOCUS_30480	sequence3:10042..10833(+)	frameshift		10824	WP_010945912.1	PIN domain-containing protein	99.2	73.7	100.0
MGA_3060	LOCUS_30490	sequence3:10802..11107(+)	frameshift		10824	WP_010945912.1	PIN domain-containing protein	96.0	27.4	97.9
MGA_3061	LOCUS_30500	sequence3:11703..11909(+)	frameshift		11897,12116	WP_010945913.1	GNAT family N-acetyltransferase	95.6	38.0	98.5
