{"end": 4150, "species": "Candidatus Rokuibacteriota bacterium", "length": 365, "features": [{"end": 4010, "phase": ".", "attributes": {"gene_biotype": "protein_coding", "Name": "Q7W02_16005", "locus_tag": "Q7W02_16005", "gbkey": "Gene", "ID": "gene-Q7W02_16005"}, "source": "Genbank", "type": "gene", "start": 3270, "seqid": "JAUSJX010000087.1", "score": ".", "strand": "-"}, {"seqid": "JAUSJX010000087.1", "start": 3270, "phase": "0", "source": "Protein Homology", "strand": "-", "score": ".", "end": 4010, "type": "CDS", "attributes": {"Dbxref": "NCBI_GP:MDO8477668.1", "go_component": "external side of cell outer membrane|0031240||IEA", "Ontology_term": "GO:0031240", "protein_id": "MDO8477668.1", "ID": "cds-MDO8477668.1", "Parent": "gene-Q7W02_16005", "transl_table": "11", "product": "PEP-CTERM sorting domain-containing protein", "gbkey": "CDS", "Name": "MDO8477668.1", "Note": "PEP-CTERM proteins occur%2C often in large numbers%2C in the proteomes of bacteria that also encode an exosortase%2C a predicted intramembrane cysteine proteinase. The presence of a PEP-CTERM domain at a protein's C-terminus predicts cleavage within the sorting domain%2C followed by covalent anchoring to some component of the (usually Gram-negative) cell surface. Many PEP-CTERM proteins exhibit an unusual sequence composition that includes large numbers of potential glycosylation sites. Expression of one such protein has been shown to restore the ability of a bacterium to form floc%2C a type of biofilm.", "inference": "COORDINATES: protein motif:HMM:TIGR02595.1", "locus_tag": "Q7W02_16005"}}], "seqid": "JAUSJX010000087.1", "start": 3786, "taxonomy": "d__Bacteria;p__Methylomirabilota;c__Methylomirabilia;o__Rokubacteriales;f__CSP1-6;g__AR37;s__AR37 sp030647435", "accession": "GCA_030647435.1", "is_reverse_complement": false, "sequence": "GAACGCCCCTGCATTGACGTCTCGCGAGACAAATGGCGACGGGCTGACCAGTCTGACGGTCTGGGAGCCGACCGCAAAGCCCGTCACCTTGAGCACGTCCGCGCGCGCCGCCGGCGCGAACGTGAGGGGGGCGCTCAGCAAGCAGAGCGCAAGGATTCCACACTGAAACGATCTCATGAATCCTCTCTCCTTATCTAAGTGACTCAAGATCGCCGTATCGGTCATGTAAGGAGCGTCCGCAGCTCGGGCCATGAAGCGGCTGGATCTGACGCTCGCGCCAGTCAATTGCAAGGATGGCGCCATGAGTTCAGGTGTGTGTGGGAAGACACTTACGCGCAGGTGCTGAATCCAGATGAGTCAGGCAG"}