# locus_id	locus_tag	location	classification	internal_stop	indel	ref_id	description	query_cov	ref_cov	identity
MGA_76	LOCUS_00630	sequence14:11303..11638(-)	partial			WP_031588332.1	recombinase family protein	100.0	55.8	99.1
MGA_85	LOCUS_00700	sequence17:1..781(+)	partial			WP_011082576.1	accumulation-associated protein Aap	87.3	15.7	54.5
MGA_87	LOCUS_00720	sequence17:2402..2572(+)	partial			WP_001795286.1	hypothetical protein	100.0	72.7	92.9
MGA_95	LOCUS_00800	sequence17:10835..11947(+)	frameshift		11866	WP_001044255.1	membrane protein	93.0	78.0	87.5
MGA_96	LOCUS_00810	sequence17:11878..12159(+)	frameshift		11863	WP_001044255.1	membrane protein	100.0	21.1	96.8
MGA_104	LOCUS_00890	sequence17:16633..16842(+)	frameshift		16764	WP_001034758.1	DUF1433 domain-containing protein	58.0	28.6	80.0
MGA_105	LOCUS_00900	sequence17:16854..17057(+)	frameshift		16764	WP_001034758.1	DUF1433 domain-containing protein	100.0	47.9	100.0
MGA_194	LOCUS_01790	sequence17:112871..113077(-)	internal_stop_codon	113147..113149(-)		WP_000276759.1	DUF2268 domain-containing protein	100.0	22.4	100.0
MGA_195	LOCUS_01800	sequence17:113147..113785(-)	internal_stop_codon	113147..113149(-)		WP_000276759.1	DUF2268 domain-containing protein	100.0	69.7	99.1
MGA_224	LOCUS_02090	sequence17:144979..145155(-)	internal_stop_codon	144979..144981(-)		WP_126475239.1	IS1182 family transposase	100.0	10.6	98.3
MGA_271	LOCUS_02560	sequence17:191760..192074(-)	frameshift		191876	WP_126475239.1	IS1182 family transposase	81.7	14.7	72.9
MGA_366	LOCUS_03500	sequence17:271926..273023(+)	frameshift		271696,273020,271822	WP_011202675.1	DEAD/DEAH box helicase family protein	100.0	24.7	33.1
MGA_367	LOCUS_03510	sequence17:273020..273313(+)	frameshift		273020	WP_010939452.1	DEAD/DEAH box helicase family protein	96.9	6.1	47.4
MGA_370	LOCUS_03540	sequence17:274540..275274(+)	partial			WP_009873568.1	AAA family ATPase	82.0	27.0	30.3
MGA_416	LOCUS_03970	sequence22:11531..11884(-)	partial			WP_001801792.1	ATP synthase subunit I	83.8	65.3	98.0
MGA_454	LOCUS_04350	sequence22:50247..50450(-)	frameshift,internal_stop_codon	50247..50249(-)	50427	WP_010925589.1	recombinase family protein	86.6	53.6	73.3
MGA_500	LOCUS_04800	sequence23:38978..39733(+)	frameshift		39571	WP_000184370.1	transglycosylase domain-containing protein	78.9	65.8	94.9
MGA_501	LOCUS_04810	sequence23:39682..39882(+)	frameshift		39571	WP_000184370.1	transglycosylase domain-containing protein	100.0	21.9	98.5
MGA_509	LOCUS_04890	sequence23:52356..53396(-)	partial			WP_000193903.1	hypothetical protein	84.1	62.4	73.2
MGA_534	LOCUS_05140	sequence23:87528..87752(-)	frameshift		87580,87775	WP_126475239.1	IS1182 family transposase	78.4	12.3	82.1
MGA_535	LOCUS_05150	sequence23:87749..88240(-)	frameshift		87579,88188,87774	WP_126475239.1	IS1182 family transposase	84.7	25.3	94.2
MGA_560	LOCUS_05360	sequence27:1..534(+)	partial			WP_001181101.1	replication initiator protein A	100.0	55.0	95.0
MGA_595	LOCUS_05710	sequence28:24526..24903(-)	frameshift		25069	WP_000149064.1	cell wall-active antibiotics response protein LiaF	100.0	53.6	100.0
MGA_661	LOCUS_06370	sequence28:93161..93508(+)	frameshift		93376,93099	WP_000179343.1	tyrosine-type recombinase/integrase	100.0	29.7	54.2
MGA_665	LOCUS_06410	sequence28:96649..97908(-)	partial			WP_000120296.1	SdrH family protein	53.9	54.5	95.1
MGA_698	LOCUS_06720	sequence31:3271..3492(-)	frameshift,internal_stop_codon	3705..3707(-)	3500	WP_001832700.1	IS200/IS605-like element ISSep3 family transposase	87.7	40.0	100.0
MGA_700	LOCUS_06740	sequence31:4498..4788(-)	frameshift		4844	WP_011117535.1	replication initiation factor domain-containing protein	99.0	31.0	63.2
MGA_701	LOCUS_06750	sequence31:4773..5258(-)	frameshift		4844	WP_011117535.1	replication initiation factor domain-containing protein	89.4	49.0	73.3
MGA_702	LOCUS_06760	sequence31:5631..5825(-)	partial			WP_000469833.1	XRE family transcriptional regulator	100.0	16.4	98.4
MGA_723	LOCUS_06970	sequence31:27097..27438(-)	partial			WP_000414629.1	MFS transporter	100.0	54.3	98.2
MGA_742	LOCUS_07160	sequence31:48759..49874(-)	internal_stop_codon	49902..49904(-)		WP_003244019.1	PLP-dependent aminotransferase family protein	100.0	77.0	37.2
MGA_743	LOCUS_07170	sequence31:49902..50156(-)	partial			WP_000577184.1	GntR family transcriptional regulator	94.0	34.9	40.7
MGA_770	LOCUS_07440	sequence31:81508..81960(+)	partial			WP_001827266.1	tRNA-dihydrouridine synthase	100.0	48.4	96.0
MGA_796	LOCUS_07700	sequence31:118719..118856(+)	partial			WP_000240855.1	50S ribosomal protein L34	60.0	60.0	100.0
MGA_808	LOCUS_07820	sequence31:127432..127782(-)	partial			WP_002305939.1	IS30 family transposase	89.7	32.6	69.2
MGA_810	LOCUS_07840	sequence31:128418..128783(-)	partial			WP_002305939.1	IS30 family transposase	86.8	32.9	68.6
MGA_840	LOCUS_08140	sequence31:156262..157020(+)	frameshift		157005	WP_000592610.1	imidazole glycerol phosphate synthase subunit HisF	98.4	53.7	100.0
MGA_841	LOCUS_08150	sequence31:157017..157649(+)	frameshift		157002	WP_000592610.1	imidazole glycerol phosphate synthase subunit HisF	100.0	45.5	100.0
MGA_842	LOCUS_08160	sequence31:157809..158021(+)	partial			WP_000837587.1	hypothetical protein	64.3	76.3	95.6
MGA_860	LOCUS_08340	sequence31:175373..175897(-)	internal_stop_codon	175907..175909(-),175373..175375(-)		WP_002485492.1	hypothetical protein	98.3	42.4	39.6
MGA_861	LOCUS_08350	sequence31:175907..176185(-)	internal_stop_codon	175907..175909(-),176273..176275(-),176363..176365(-),176189..176191(-)		WP_002485492.1	hypothetical protein	95.7	19.6	41.7
MGA_862	LOCUS_08360	sequence31:176363..177163(-)	internal_stop_codon	176273..176275(-),177365..177367(-),177443..177445(-),177173..177175(-),176363..176365(-),176189..176191(-),177263..177265(-)		WP_002485492.1	hypothetical protein	99.2	50.8	40.7
MGA_863	LOCUS_08370	sequence31:177443..178651(-)	internal_stop_codon	177443..177445(-),178775..178777(-),177365..177367(-),177263..177265(-)		WP_002485492.1	hypothetical protein	99.0	73.8	38.0
MGA_864	LOCUS_08380	sequence31:178775..179539(-)	internal_stop_codon	179627..179629(-),179690..179692(-),179633..179635(-),178775..178777(-)		WP_002485492.1	hypothetical protein	63.0	29.8	34.1
MGA_865	LOCUS_08390	sequence31:179520..179891(+)	partial			WP_000044547.1	serine-rich repeat glycoprotein adhesin SasA	55.3	3.0	92.6
MGA_889	LOCUS_08630	sequence31:214219..216651(+)	frameshift		216381	WP_000745891.1	MSCRAMM family adhesin clumping factor ClfB	68.1	62.9	97.6
MGA_906	LOCUS_08800	sequence31:236708..237394(+)	partial			WP_003894962.1	MBL fold metallo-hydrolase	61.4	67.3	30.8
MGA_946	LOCUS_09200	sequence31:275059..275379(-)	partial			WP_001795157.1	hypothetical protein	100.0	63.9	99.1
MGA_994	LOCUS_09680	sequence31:328838..329344(-)	frameshift		328870	WP_000773921.1	ATP-binding cassette domain-containing protein	93.5	74.4	91.1
MGA_1008	LOCUS_09820	sequence31:342110..342574(+)	partial			WP_011948695.1	MarR family transcriptional regulator	85.1	73.0	38.2
MGA_1022	LOCUS_09960	sequence31:361653..361862(+)	frameshift		361512	WP_000794614.1	fibronectin-binding protein FnbA	100.0	6.6	94.2
MGA_1065	LOCUS_10360	sequence33:42593..43837(+)	partial			WP_011026975.1	lanthionine synthetase C family protein	75.1	69.1	24.1
MGA_1066	LOCUS_10370	sequence33:43853..44371(+)	partial			WP_010880496.1	bifunctional phosphopantothenoylcysteine decarboxylase/phosphopantothenate--cysteine ligase CoaBC	77.9	35.3	38.0
MGA_1067	LOCUS_10380	sequence33:44381..45754(+)	partial			WP_000699969.1	S8 family serine peptidase	69.1	55.1	38.9
MGA_1077	LOCUS_10480	sequence33:54122..54397(+)	partial			WP_001038752.1	serine protease SplF	70.3	26.8	98.4
MGA_1078	LOCUS_10490	sequence33:54286..54693(+)	partial			WP_001038752.1	serine protease SplF	90.4	51.0	100.0
MGA_1080	LOCUS_10500	sequence33:55507..56307(+)	partial			WP_001793440.1	type I restriction-modification system subunit M	90.2	41.5	100.0
MGA_1082	LOCUS_10520	sequence33:58349..62461(+)	partial			WP_011391500.1	hypothetical protein	48.8	43.2	26.4
MGA_1083	LOCUS_10530	sequence33:62981..63358(+)	partial			WP_010989411.1	DUF1433 domain-containing protein	74.4	66.9	44.1
MGA_1084	LOCUS_10540	sequence33:64228..64371(+)	frameshift,internal_stop_codon	64369..64371(+)	64380	WP_000159787.1	transposase	89.4	46.7	76.2
MGA_1142	LOCUS_11120	sequence34:42529..42819(-)	frameshift		42919	WP_000540323.1	tandem-type lipoprotein	100.0	36.1	95.8
MGA_1143	LOCUS_11130	sequence34:42893..43351(-)	frameshift		42922	WP_001802016.1	tandem-type lipoprotein	92.8	52.2	86.5
MGA_1146	LOCUS_11160	sequence34:45199..45576(-)	frameshift		45617	WP_000540323.1	tandem-type lipoprotein	99.2	47.0	84.8
MGA_1147	LOCUS_11170	sequence34:45573..45977(-)	frameshift		45590	WP_001557594.1	tandem-type lipoprotein	95.5	50.2	66.4
MGA_1149	LOCUS_11190	sequence34:46845..47063(-)	frameshift		46904,47187	WP_001557596.1	tandem-type lipoprotein	98.6	26.2	78.9
MGA_1150	LOCUS_11200	sequence34:47179..47652(-)	frameshift		46904,47187	WP_001557596.1	tandem-type lipoprotein	88.5	51.9	83.5
MGA_1156	LOCUS_11260	sequence34:52646..53248(-)	frameshift		53334	WP_000072584.1	restriction endonuclease subunit S	100.0	49.6	98.0
MGA_1157	LOCUS_11270	sequence34:53332..53853(-)	frameshift		53346	WP_000072584.1	restriction endonuclease subunit S	97.7	41.9	100.0
MGA_1163	LOCUS_11330	sequence34:59739..60434(-)	partial			WP_000705657.1	superantigen-like protein SSL4	92.2	72.6	42.3
MGA_1196	LOCUS_11660	sequence34:90993..91151(+)	frameshift		90964,91237,90871,91129,91324	WP_047210621.1	site-specific integrase	88.5	11.3	84.8
MGA_1197	LOCUS_11670	sequence34:91229..91540(+)	frameshift		91332,90963,91236,91131	WP_047210621.1	site-specific integrase	75.7	19.2	66.7
MGA_1212	LOCUS_11820	sequence34:105480..106247(-)	frameshift		106305	WP_000199066.1	acetyl-CoA C-acetyltransferase	100.0	64.9	98.8
MGA_1213	LOCUS_11830	sequence34:106264..106653(-)	frameshift		106305	WP_000199066.1	acetyl-CoA C-acetyltransferase	80.6	26.5	100.0
MGA_1274	LOCUS_12440	sequence34:164322..164762(-)	frameshift		164366	WP_000208417.1	DUF5079 family protein	89.7	57.7	85.5
MGA_1276	LOCUS_12460	sequence34:165438..165596(-)	frameshift		165648	WP_000142044.1	TIGR01741 family protein	90.4	28.8	83.0
MGA_1277	LOCUS_12470	sequence34:165640..165792(-)	frameshift		165648	WP_000141941.1	TIGR01741 family protein	96.0	28.9	87.5
MGA_1282	LOCUS_12520	sequence34:168083..168268(-)	frameshift		168353	WP_000208417.1	DUF5079 family protein	100.0	26.9	96.7
MGA_1306	LOCUS_12750	sequence34:194131..194358(-)	partial			WP_126475239.1	IS1182 family transposase	85.3	11.7	98.4
MGA_1329	LOCUS_12980	sequence34:218271..218573(-)	frameshift		218571	WP_000638475.1	2-C-methyl-D-erythritol 4-phosphate cytidylyltransferase	92.0	38.7	100.0
MGA_1330	LOCUS_12990	sequence34:218542..218967(-)	frameshift		218571	WP_000638475.1	2-C-methyl-D-erythritol 4-phosphate cytidylyltransferase	94.3	55.9	97.0
MGA_1374	LOCUS_13430	sequence34:275464..276423(-)	partial			WP_001796914.1	ABC transporter permease	100.0	64.8	91.5
MGA_1529	LOCUS_14920	sequence40:69882..70028(+)	partial			WP_000009238.1	SAS049 family protein	72.9	72.9	100.0
MGA_1576	LOCUS_15390	sequence40:117696..117872(+)	partial			WP_000048060.1	30S ribosomal protein S21	74.1	74.1	100.0
MGA_1665	LOCUS_16280	sequence40:199296..199502(+)	partial			WP_001033761.1	hypothetical protein	92.6	8.8	63.5
MGA_1745	LOCUS_17080	sequence40:313153..313347(+)	frameshift		313344	WP_095092556.1	IS1182 family transposase	68.8	7.8	79.5
MGA_1746	LOCUS_17090	sequence40:313409..313753(+)	frameshift		313344	WP_126475239.1	IS1182 family transposase	99.1	20.7	96.5
MGA_1762	LOCUS_17250	sequence40:329375..329671(-)	partial			WP_126475239.1	IS1182 family transposase	99.0	17.8	95.9
MGA_1812	LOCUS_17750	sequence40:388916..389287(-)	frameshift		389415	WP_000688122.1	GMP reductase	100.0	37.8	99.2
MGA_1813	LOCUS_17760	sequence40:389389..389874(-)	frameshift		389439	WP_000688122.1	GMP reductase	89.4	44.3	99.3
MGA_1837	LOCUS_18000	sequence40:410891..411241(-)	partial			WP_002485350.1	minor capsid protein	100.0	25.9	72.4
MGA_1839	LOCUS_18020	sequence40:411487..411777(-)	internal_stop_codon	411868..411870(-),411787..411789(-)		WP_002485350.1	minor capsid protein	94.8	22.8	45.1
MGA_1843	LOCUS_18060	sequence40:413251..413835(-)	partial			WP_002485350.1	minor capsid protein	68.6	35.5	56.0
MGA_1852	LOCUS_18150	sequence40:421631..421927(-)	frameshift		421929	WP_000068617.1	GTPase HflX	100.0	23.8	100.0
MGA_1853	LOCUS_18160	sequence40:421924..422847(-)	frameshift		421947	WP_000068617.1	GTPase HflX	97.7	72.8	96.0
MGA_1915	LOCUS_18780	sequence40:496724..497404(-)	frameshift		496747	WP_000236726.1	ribosome biogenesis GTPase YlqF	96.9	74.5	99.5
MGA_1916	LOCUS_18790	sequence40:497784..498797(+)	frameshift		498677	WP_000915238.1	lipoteichoic acid-specific glycosyltransferase YfhO	86.4	33.5	97.9
MGA_1917	LOCUS_18800	sequence40:498881..500419(+)	frameshift		498683	WP_000915238.1	lipoteichoic acid-specific glycosyltransferase YfhO	100.0	59.0	92.6
MGA_1945	LOCUS_19080	sequence40:529190..529393(+)	partial			WP_001548522.1	TM2 domain-containing protein	100.0	72.8	100.0
MGA_1964	LOCUS_19270	sequence40:551250..551444(+)	partial			WP_126475239.1	IS1182 family transposase	81.2	9.5	96.2
MGA_2003	LOCUS_19660	sequence40:589890..590216(-)	internal_stop_codon	589890..589892(-)		WP_000584398.1	hypothetical protein	91.7	58.9	87.9
MGA_2080	LOCUS_20430	sequence40:668194..668328(+)	partial			WP_000064214.1	glycopeptide resistance-associated protein GraF	54.5	54.5	100.0
MGA_2118	LOCUS_20810	sequence40:711487..711702(+)	partial			WP_001788574.1	NINE protein	100.0	74.0	97.2
MGA_2284	LOCUS_22470	sequence40:872894..873664(-)	partial			WP_000190248.1	DnaD domain protein	38.3	39.1	43.9
MGA_2297	LOCUS_22600	sequence40:878240..879007(-)	partial			WP_001148557.1	phage antirepressor KilAC domain-containing protein	73.3	72.2	88.2
MGA_2339	LOCUS_23020	sequence40:910590..910709(-)	frameshift		910595	WP_000791702.1	von Willebrand factor binding protein Vwb	94.9	7.4	97.3
MGA_2340	LOCUS_23030	sequence40:910930..913659(-)	partial			WP_001056195.1	MSCRAMM family adhesin clumping factor ClfA	61.5	56.5	82.6
MGA_2371	LOCUS_23340	sequence40:949248..949478(-)	internal_stop_codon	949566..949568(-)		WP_000538141.1	HD domain-containing protein	100.0	35.2	98.7
MGA_2372	LOCUS_23350	sequence40:949566..949898(-)	internal_stop_codon	949566..949568(-)		WP_000538141.1	HD domain-containing protein	100.0	50.9	97.3
MGA_2436	LOCUS_23990	sequence40:1019678..1019962(+)	partial			WP_001801730.1	hypothetical protein	90.4	73.9	100.0
MGA_2440	LOCUS_24030	sequence40:1023822..1024622(-)	frameshift		1023878	WP_000435109.1	aldo/keto reductase family oxidoreductase	93.2	82.1	100.0
MGA_2527	LOCUS_24900	sequence40:1110748..1110993(-)	partial			WP_000020814.1	T7SS effector LXG polymorphic toxin	66.7	11.6	57.4
MGA_2541	LOCUS_25040	sequence40:1122383..1122724(-)	partial			WP_000798967.1	DUF1450 domain-containing protein	69.0	69.0	100.0
MGA_2571	LOCUS_25340	sequence40:1153952..1154107(-)	frameshift		1154376	WP_000934467.1	MSCRAMM family adhesin SdrD	100.0	3.7	88.2
MGA_2573	LOCUS_25360	sequence40:1154349..1157918(-)	frameshift		1154648,1154387,1154726,1154376	WP_000934467.1	MSCRAMM family adhesin SdrD	89.6	76.9	91.8
MGA_2574	LOCUS_25370	sequence40:1158285..1158776(-)	frameshift		1158728,1158729,1158926	WP_001060462.1	MSCRAMM family adhesin SdrC	41.1	7.0	85.1
MGA_2575	LOCUS_25380	sequence40:1158682..1161180(-)	frameshift		1158728,1158732,1158926	WP_001060462.1	MSCRAMM family adhesin SdrC	86.2	75.2	94.7
MGA_2620	LOCUS_25830	sequence41:1..1116(+)	internal_stop_codon	1114..1116(+)		WP_001557163.1	ISL3-like element IS1181 family transposase	100.0	84.5	97.6
