ChEMBL · Schema

ChEMBL Target

A biological target in ChEMBL, which can be a single protein, protein complex, organism, cell line, nucleic acid, or other biological entity.

Drug Discovery · Bioactivity · Molecules · Cheminformatics · Life Sciences · Bioinformatics · Pharmacology · EMBL-EBI

Properties

Name Type Description
target_chembl_id string Unique ChEMBL identifier for the target
pref_name string Preferred name for the target (manually curated)
target_type string Classification of the target type
organism string | null Source organism of the target (e.g., Homo sapiens)
tax_id integer | null NCBI taxonomy ID of the target organism
species_group_flag boolean | null Indicates if the target represents a group of species rather than a single organism
target_components array Protein components (sequences) that make up this target
cross_references array Cross-references to external databases
View JSON Schema on GitHub

JSON Schema

target.json Raw ↑
{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "https://www.ebi.ac.uk/chembl/schema/target",
  "title": "ChEMBL Target",
  "description": "A biological target in ChEMBL, which can be a single protein, protein complex, organism, cell line, nucleic acid, or other biological entity.",
  "type": "object",
  "properties": {
    "target_chembl_id": {
      "type": "string",
      "pattern": "^CHEMBL[0-9]+$",
      "description": "Unique ChEMBL identifier for the target"
    },
    "pref_name": {
      "type": "string",
      "description": "Preferred name for the target (manually curated)"
    },
    "target_type": {
      "type": "string",
      "enum": [
        "SINGLE PROTEIN",
        "PROTEIN COMPLEX",
        "PROTEIN FAMILY",
        "PROTEIN COMPLEX GROUP",
        "SELECTIVITY GROUP",
        "ORGANISM",
        "TISSUE",
        "CELL-LINE",
        "NUCLEIC-ACID",
        "ADMET",
        "SUBCELLULAR",
        "METAL",
        "CHIMERIC PROTEIN",
        "PROTEIN-PROTEIN INTERACTION",
        "PROTEIN PROTEIN INTERACTION",
        "PROTEIN NUCLEIC-ACID COMPLEX",
        "MACROMOLECULE",
        "SMALL MOLECULE",
        "OLIGOSACCHARIDE",
        "LIPID",
        "PHENOTYPE",
        "3D CELL CULTURE",
        "NON-MOLECULAR",
        "NO TARGET",
        "UNCHECKED",
        "UNKNOWN"
      ],
      "description": "Classification of the target type"
    },
    "organism": {
      "type": ["string", "null"],
      "description": "Source organism of the target (e.g., Homo sapiens)"
    },
    "tax_id": {
      "type": ["integer", "null"],
      "description": "NCBI taxonomy ID of the target organism"
    },
    "species_group_flag": {
      "type": ["boolean", "null"],
      "description": "Indicates if the target represents a group of species rather than a single organism"
    },
    "target_components": {
      "type": "array",
      "description": "Protein components (sequences) that make up this target",
      "items": {
        "type": "object",
        "properties": {
          "accession": {
            "type": ["string", "null"],
            "description": "UniProt accession number for the protein component"
          },
          "component_description": {
            "type": ["string", "null"],
            "description": "Description of the component"
          },
          "component_id": {
            "type": "integer",
            "description": "Integer identifier of the component"
          },
          "component_type": {
            "type": "string",
            "enum": ["PROTEIN", "DNA", "RNA"],
            "description": "Type of component sequence"
          },
          "relationship": {
            "type": "string",
            "description": "Relationship of this component to the target (e.g., SINGLE PROTEIN, SUBUNIT)"
          },
          "target_component_id": {
            "type": "integer",
            "description": "Integer identifier of the target component entry"
          }
        }
      }
    },
    "cross_references": {
      "type": "array",
      "description": "Cross-references to external databases",
      "items": {
        "type": "object",
        "properties": {
          "xref_id": {
            "type": "string",
            "description": "Identifier of the referenced entry in the external database"
          },
          "xref_name": {
            "type": ["string", "null"],
            "description": "Name of the referenced entry in the external database, if available"
          },
          "xref_src": {
            "type": "string",
            "description": "Source database abbreviation (e.g., UniProt, Ensembl, HGNC)"
          }
        }
      }
    }
  },
  "required": ["target_chembl_id", "pref_name", "target_type"],
  "examples": [
    {
      "target_chembl_id": "CHEMBL301",
      "pref_name": "Cyclooxygenase-2",
      "target_type": "SINGLE PROTEIN",
      "organism": "Homo sapiens",
      "tax_id": 9606,
      "species_group_flag": false,
      "target_components": [
        {
          "accession": "P35354",
          "component_description": "Prostaglandin G/H synthase 2",
          "component_id": 382,
          "component_type": "PROTEIN",
          "relationship": "SINGLE PROTEIN",
          "target_component_id": 382
        }
      ],
      "cross_references": [
        {
          "xref_id": "P35354",
          "xref_name": "PTGS2_HUMAN",
          "xref_src": "UniProt"
        },
        {
          "xref_id": "ENSG00000073756",
          "xref_name": "PTGS2",
          "xref_src": "Ensembl"
        }
      ]
    }
  ]
}