{"accession": "GCF_901538265.1", "is_reverse_complement": false, "start": 9439835, "features": [{"start": 9439947, "attributes": {"Name": "WP_162672681.1", "Dbxref": "GenBank:WP_162672681.1", "ID": "cds-WP_162672681.1", "locus_tag": "SOIL9_RS39610", "Parent": "gene-SOIL9_RS39610", "protein_id": "WP_162672681.1", "product": "DUF1464 family protein", "inference": "COORDINATES: similar to AA sequence:RefSeq:WP_015248220.1", "transl_table": "11", "gbkey": "CDS"}, "source": "Protein Homology", "type": "CDS", "score": ".", "end": 9440981, "phase": "0", "seqid": "NZ_LR593886.1", "strand": "+"}, {"attributes": {"gene_biotype": "protein_coding", "Name": "SOIL9_RS39605", "old_locus_tag": "SOIL9_75890", "ID": "gene-SOIL9_RS39605", "locus_tag": "SOIL9_RS39605", "gbkey": "Gene"}, "strand": "+", "type": "gene", "phase": ".", "source": "RefSeq", "start": 9439298, "end": 9439936, "seqid": "NZ_LR593886.1", "score": "."}, {"source": "RefSeq", "seqid": "NZ_LR593886.1", "start": 9439947, "strand": "+", "score": ".", "phase": ".", "end": 9440981, "attributes": {"locus_tag": "SOIL9_RS39610", "ID": "gene-SOIL9_RS39610", "old_locus_tag": "SOIL9_75880", "Name": "SOIL9_RS39610", "gene_biotype": "protein_coding", "gbkey": "Gene"}, "type": "gene"}, {"start": 9439298, "strand": "+", "type": "CDS", "end": 9439936, "source": "GeneMarkS-2+", "phase": "0", "seqid": "NZ_LR593886.1", "attributes": {"Ontology_term": "GO:0031240", "go_component": "external side of cell outer membrane|0031240||IEA", "product": "PEP-CTERM sorting domain-containing protein", "transl_table": "11", "Name": "WP_162672680.1", "Dbxref": "GenBank:WP_162672680.1", "Note": "PEP-CTERM proteins occur%2C often in large numbers%2C in the proteomes of bacteria that also encode an exosortase%2C a predicted intramembrane cysteine proteinase. 
The presence of a PEP-CTERM domain at a protein's C-terminus predicts cleavage within the sorting domain%2C followed by covalent anchoring to some component of the (usually Gram-negative) cell surface. Many PEP-CTERM proteins exhibit an unusual sequence composition that includes large numbers of potential glycosylation sites. Expression of one such protein has been shown to restore the ability of a bacterium to form floc%2C a type of biofilm.", "protein_id": "WP_162672680.1", "ID": "cds-WP_162672680.1", "gbkey": "CDS", "inference": "COORDINATES: ab initio prediction:GeneMarkS-2+", "locus_tag": "SOIL9_RS39605", "Parent": "gene-SOIL9_RS39605"}, "score": "."}], "end": 9440300, "seqid": "NZ_LR593886.1", "sequence": "CCGAACGTGCCGGCCACACTCAGCCCGGAACCCGGGACGCTGGCACTGTTCGCGCTGGGATTGGCCCCCCTGGGACTGCGCCGGTTGCGGCGGATCTGGTAGAACTCTTCTCATGCCCCGCGTAGCTGGTTGTGACCCGGGAACGTCGTCGCTCGACATGCTCGCGCTCGAAGACGGGCGCGTCGTGGCCCAAGTGCGTATCGAACCGGATGAGCTGCGCGCCGATCCGACCATTCCCGTGCAGTGGCTCCGAGCCGAGGGGCCGTTCGATCTCATCGCGGGACCATCAGGTTACGGACTGCCTCTGGTACACGCGGCGGATTGCACGGACACGCAACTCGATCTGATGTCGCTGGTGCGCCCCGACGAGCGAGGCGCAGGGGGCGTTGGCGGGTTCTCTGCGATGGCCCGTGCGCTGCGCGATTCCGGGTTACCCGTAGTGTTCCTCCCCGGTGTCATCCACCTC", "species": "Gemmata massiliana", "length": 466, "taxonomy": "d__Bacteria;p__Planctomycetota;c__Planctomycetia;o__Gemmatales;f__Gemmataceae;g__Gemmata;s__Gemmata massiliana_A"}