KGX STORAGE

graph-metadata.json
Back to Folder Download File
Size: 12.9 KB Modified: 2026-01-06 07:54:14
JSON Content
{
  "@id": "https://stars.renci.org/var/translator/releases/cohd/2026_01_03/",
  "@type": "sc:Dataset",
  "name": "cohd",
  "description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
  "license": "MIT",
  "url": "https://stars.renci.org/var/translator/releases/cohd/2026_01_03/",
  "version": "cohd_2024-11-25_1.0_2025sep1_4.3.6",
  "dateCreated": "2026_01_03",
  "biolinkVersion": "4.3.6",
  "babelVersion": "2025sep1",
  "distribution": [
    {
      "@id": "cohd.tar.xz",
      "@type": "cr:FileObject",
      "contentUrl": "cohd.tar.xz",
      "encodingFormat": "application/x-xz",
      "description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
    }
  ],
  "isBasedOn": [
    {
      "id": "cohd",
      "name": "Columbia Open Health Data",
      "description": "The COHD provides access to counts and patient prevalence (i.e., prevalence from electronic health records) of conditions, procedures, drug exposures, and patient demographics, and the co-occurrence frequencies between them. Count and frequency data were derived from the Columbia University Irving Medical Center's OHDSI database including inpatient and outpatient data. Counts are the number of patients with the concept, e.g.,  diagnosed with a condition, exposed to a drug, or who had a procedure.  Frequencies are the number of patients with the concept divided by the total number of patients in the dataset. Clinical concepts (e.g., conditions, procedures, drugs) are coded by their standard concept ID in the OMOP Common Data Model.  To protect patient privacy, all concepts and pairs of concepts where the count \u2264 10 were excluded, and counts were randomized by the Poisson distribution.",
      "license": {
        "terms_of_use_url": null,
        "terms_of_use_description": null,
        "license name": null,
        "license url": null
      },
      "url": "https://stars.renci.org/var/data_services/cohd_2/cohd_nodes.jsonl",
      "version": "2024-11-25"
    }
  ],
  "schema": {
    "nodes": [
      {
        "category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "count": 61,
        "id_prefixes": {
          "CHEBI": 59,
          "UNII": 2
        },
        "attributes": {
          "name": 61,
          "equivalent_identifiers": 61,
          "information_content": 25
        }
      },
      {
        "category": [
          "biolink:Drug"
        ],
        "count": 14,
        "id_prefixes": {
          "RXCUI": 8,
          "CHEBI": 4,
          "DRUGBANK": 1,
          "UNII": 1
        },
        "attributes": {
          "name": 14,
          "equivalent_identifiers": 14,
          "information_content": 1
        }
      },
      {
        "category": [
          "biolink:SmallMolecule"
        ],
        "count": 2,
        "id_prefixes": {
          "CHEBI": 2
        },
        "attributes": {
          "name": 2,
          "equivalent_identifiers": 2,
          "information_content": 2
        }
      },
      {
        "category": [
          "biolink:ChemicalEntity"
        ],
        "count": 2,
        "id_prefixes": {
          "CHEBI": 1,
          "MESH": 1
        },
        "attributes": {
          "name": 2,
          "equivalent_identifiers": 2,
          "information_content": 1
        }
      },
      {
        "category": [
          "biolink:Disease"
        ],
        "count": 6,
        "id_prefixes": {
          "DOID": 2,
          "MONDO": 2,
          "UMLS": 2
        },
        "attributes": {
          "name": 6,
          "equivalent_identifiers": 6,
          "information_content": 5
        }
      },
      {
        "category": [
          "biolink:MolecularMixture"
        ],
        "count": 1,
        "id_prefixes": {
          "UNII": 1
        },
        "attributes": {
          "name": 1,
          "equivalent_identifiers": 1
        }
      }
    ],
    "nodes_summary": {
      "total_count": 86,
      "id_prefixes": {
        "CHEBI": 66,
        "RXCUI": 8,
        "UNII": 4,
        "DOID": 2,
        "MONDO": 2,
        "UMLS": 2,
        "DRUGBANK": 1,
        "MESH": 1
      },
      "attributes": {
        "name": 86,
        "equivalent_identifiers": 86,
        "information_content": 34
      }
    },
    "edges": [
      {
        "subject_category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 26,
        "primary_knowledge_sources": {
          "infores:cohd": 26
        },
        "qualifiers": {},
        "attributes": {
          "id": 26,
          "category": 26,
          "knowledge_level": 26,
          "agent_type": 26,
          "has_confidence_score": 26,
          "original_subject": 26,
          "original_object": 26
        },
        "subject_id_prefixes": {
          "CHEBI": 25,
          "UNII": 1
        },
        "object_id_prefixes": {
          "MONDO": 26
        }
      },
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Drug"
        ],
        "count": 5,
        "primary_knowledge_sources": {
          "infores:cohd": 5
        },
        "qualifiers": {},
        "attributes": {
          "id": 5,
          "category": 5,
          "knowledge_level": 5,
          "agent_type": 5,
          "has_confidence_score": 5,
          "original_subject": 5,
          "original_object": 5
        },
        "subject_id_prefixes": {
          "DOID": 5
        },
        "object_id_prefixes": {
          "RXCUI": 4,
          "CHEBI": 1
        }
      },
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "count": 21,
        "primary_knowledge_sources": {
          "infores:cohd": 21
        },
        "qualifiers": {},
        "attributes": {
          "id": 21,
          "category": 21,
          "knowledge_level": 21,
          "agent_type": 21,
          "has_confidence_score": 21,
          "original_subject": 21,
          "original_object": 21
        },
        "subject_id_prefixes": {
          "DOID": 21
        },
        "object_id_prefixes": {
          "CHEBI": 19,
          "UNII": 2
        }
      },
      {
        "subject_category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "count": 15,
        "primary_knowledge_sources": {
          "infores:cohd": 15
        },
        "qualifiers": {},
        "attributes": {
          "id": 15,
          "category": 15,
          "knowledge_level": 15,
          "agent_type": 15,
          "has_confidence_score": 15,
          "original_subject": 15,
          "original_object": 15
        },
        "subject_id_prefixes": {
          "CHEBI": 15
        },
        "object_id_prefixes": {
          "CHEBI": 15
        }
      },
      {
        "subject_category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Drug"
        ],
        "count": 3,
        "primary_knowledge_sources": {
          "infores:cohd": 3
        },
        "qualifiers": {},
        "attributes": {
          "id": 3,
          "category": 3,
          "knowledge_level": 3,
          "agent_type": 3,
          "has_confidence_score": 3,
          "original_subject": 3,
          "original_object": 3
        },
        "subject_id_prefixes": {
          "CHEBI": 3
        },
        "object_id_prefixes": {
          "UNII": 1,
          "RXCUI": 1,
          "CHEBI": 1
        }
      },
      {
        "subject_category": [
          "biolink:Drug",
          "biolink:SmallMolecule"
        ],
        "predicate": "biolink:negatively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 2,
        "primary_knowledge_sources": {
          "infores:cohd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 2,
          "category": 2,
          "knowledge_level": 2,
          "agent_type": 2,
          "has_confidence_score": 2,
          "original_subject": 2,
          "original_object": 2
        },
        "subject_id_prefixes": {
          "CHEBI": 2
        },
        "object_id_prefixes": {
          "MONDO": 2
        }
      },
      {
        "subject_category": [
          "biolink:Drug"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 6,
        "primary_knowledge_sources": {
          "infores:cohd": 6
        },
        "qualifiers": {},
        "attributes": {
          "id": 6,
          "category": 6,
          "knowledge_level": 6,
          "agent_type": 6,
          "has_confidence_score": 6,
          "original_subject": 6,
          "original_object": 6
        },
        "subject_id_prefixes": {
          "RXCUI": 3,
          "CHEBI": 2,
          "DRUGBANK": 1
        },
        "object_id_prefixes": {
          "MONDO": 6
        }
      },
      {
        "subject_category": [
          "biolink:SmallMolecule"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 2,
        "primary_knowledge_sources": {
          "infores:cohd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 2,
          "category": 2,
          "knowledge_level": 2,
          "agent_type": 2,
          "has_confidence_score": 2,
          "original_subject": 2,
          "original_object": 2
        },
        "subject_id_prefixes": {
          "CHEBI": 2
        },
        "object_id_prefixes": {
          "MONDO": 2
        }
      },
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 1,
        "primary_knowledge_sources": {
          "infores:cohd": 1
        },
        "qualifiers": {},
        "attributes": {
          "id": 1,
          "category": 1,
          "knowledge_level": 1,
          "agent_type": 1,
          "has_confidence_score": 1,
          "original_subject": 1,
          "original_object": 1
        },
        "subject_id_prefixes": {
          "UMLS": 1
        },
        "object_id_prefixes": {
          "UMLS": 1
        }
      },
      {
        "subject_category": [
          "biolink:ChemicalEntity"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 2,
        "primary_knowledge_sources": {
          "infores:cohd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 2,
          "category": 2,
          "knowledge_level": 2,
          "agent_type": 2,
          "has_confidence_score": 2,
          "original_subject": 2,
          "original_object": 2
        },
        "subject_id_prefixes": {
          "CHEBI": 1,
          "MESH": 1
        },
        "object_id_prefixes": {
          "MONDO": 2
        }
      },
      {
        "subject_category": [
          "biolink:MolecularMixture"
        ],
        "predicate": "biolink:positively_correlated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 1,
        "primary_knowledge_sources": {
          "infores:cohd": 1
        },
        "qualifiers": {},
        "attributes": {
          "id": 1,
          "category": 1,
          "knowledge_level": 1,
          "agent_type": 1,
          "has_confidence_score": 1,
          "original_subject": 1,
          "original_object": 1
        },
        "subject_id_prefixes": {
          "UNII": 1
        },
        "object_id_prefixes": {
          "MONDO": 1
        }
      }
    ],
    "edges_summary": {
      "total_count": 84,
      "predicates": {
        "biolink:positively_correlated_with": 82,
        "biolink:negatively_correlated_with": 2
      },
      "primary_knowledge_sources": {
        "infores:cohd": 84
      },
      "predicates_by_knowledge_source": {
        "infores:cohd": {
          "biolink:positively_correlated_with": 82,
          "biolink:negatively_correlated_with": 2
        }
      },
      "qualifiers": {},
      "attributes": {
        "id": 84,
        "category": 84,
        "knowledge_level": 84,
        "agent_type": 84,
        "has_confidence_score": 84,
        "original_subject": 84,
        "original_object": 84
      }
    }
  }
}