{
"@id": "https://stars.renci.org/var/translator/releases/cohd/2026_01_03/",
"@type": "sc:Dataset",
"name": "cohd",
"description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
"license": "MIT",
"url": "https://stars.renci.org/var/translator/releases/cohd/2026_01_03/",
"version": "cohd_2024-11-25_1.0_2025sep1_4.3.6",
"dateCreated": "2026_01_03",
"biolinkVersion": "4.3.6",
"babelVersion": "2025sep1",
"distribution": [
{
"@id": "cohd.tar.xz",
"@type": "cr:FileObject",
"contentUrl": "cohd.tar.xz",
"encodingFormat": "application/x-xz",
"description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
}
],
"isBasedOn": [
{
"id": "cohd",
"name": "Columbia Open Health Data",
"description": "The COHD provides access to counts and patient prevalence (i.e., prevalence from electronic health records) of conditions, procedures, drug exposures, and patient demographics, and the co-occurrence frequencies between them. Count and frequency data were derived from the Columbia University Irving Medical Center's OHDSI database including inpatient and outpatient data. Counts are the number of patients with the concept, e.g., diagnosed with a condition, exposed to a drug, or who had a procedure. Frequencies are the number of patients with the concept divided by the total number of patients in the dataset. Clinical concepts (e.g., conditions, procedures, drugs) are coded by their standard concept ID in the OMOP Common Data Model. To protect patient privacy, all concepts and pairs of concepts where the count \u2264 10 were excluded, and counts were randomized by the Poisson distribution.",
"license": {
"terms_of_use_url": null,
"terms_of_use_description": null,
"license name": null,
"license url": null
},
"url": "https://stars.renci.org/var/data_services/cohd_2/cohd_nodes.jsonl",
"version": "2024-11-25"
}
],
"schema": {
"nodes": [
{
"category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"count": 61,
"id_prefixes": {
"CHEBI": 59,
"UNII": 2
},
"attributes": {
"name": 61,
"equivalent_identifiers": 61,
"information_content": 25
}
},
{
"category": [
"biolink:Drug"
],
"count": 14,
"id_prefixes": {
"RXCUI": 8,
"CHEBI": 4,
"DRUGBANK": 1,
"UNII": 1
},
"attributes": {
"name": 14,
"equivalent_identifiers": 14,
"information_content": 1
}
},
{
"category": [
"biolink:SmallMolecule"
],
"count": 2,
"id_prefixes": {
"CHEBI": 2
},
"attributes": {
"name": 2,
"equivalent_identifiers": 2,
"information_content": 2
}
},
{
"category": [
"biolink:ChemicalEntity"
],
"count": 2,
"id_prefixes": {
"CHEBI": 1,
"MESH": 1
},
"attributes": {
"name": 2,
"equivalent_identifiers": 2,
"information_content": 1
}
},
{
"category": [
"biolink:Disease"
],
"count": 6,
"id_prefixes": {
"DOID": 2,
"MONDO": 2,
"UMLS": 2
},
"attributes": {
"name": 6,
"equivalent_identifiers": 6,
"information_content": 5
}
},
{
"category": [
"biolink:MolecularMixture"
],
"count": 1,
"id_prefixes": {
"UNII": 1
},
"attributes": {
"name": 1,
"equivalent_identifiers": 1
}
}
],
"nodes_summary": {
"total_count": 86,
"id_prefixes": {
"CHEBI": 66,
"RXCUI": 8,
"UNII": 4,
"DOID": 2,
"MONDO": 2,
"UMLS": 2,
"DRUGBANK": 1,
"MESH": 1
},
"attributes": {
"name": 86,
"equivalent_identifiers": 86,
"information_content": 34
}
},
"edges": [
{
"subject_category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 26,
"primary_knowledge_sources": {
"infores:cohd": 26
},
"qualifiers": {},
"attributes": {
"id": 26,
"category": 26,
"knowledge_level": 26,
"agent_type": 26,
"has_confidence_score": 26,
"original_subject": 26,
"original_object": 26
},
"subject_id_prefixes": {
"CHEBI": 25,
"UNII": 1
},
"object_id_prefixes": {
"MONDO": 26
}
},
{
"subject_category": [
"biolink:Disease"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Drug"
],
"count": 5,
"primary_knowledge_sources": {
"infores:cohd": 5
},
"qualifiers": {},
"attributes": {
"id": 5,
"category": 5,
"knowledge_level": 5,
"agent_type": 5,
"has_confidence_score": 5,
"original_subject": 5,
"original_object": 5
},
"subject_id_prefixes": {
"DOID": 5
},
"object_id_prefixes": {
"RXCUI": 4,
"CHEBI": 1
}
},
{
"subject_category": [
"biolink:Disease"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"count": 21,
"primary_knowledge_sources": {
"infores:cohd": 21
},
"qualifiers": {},
"attributes": {
"id": 21,
"category": 21,
"knowledge_level": 21,
"agent_type": 21,
"has_confidence_score": 21,
"original_subject": 21,
"original_object": 21
},
"subject_id_prefixes": {
"DOID": 21
},
"object_id_prefixes": {
"CHEBI": 19,
"UNII": 2
}
},
{
"subject_category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"count": 15,
"primary_knowledge_sources": {
"infores:cohd": 15
},
"qualifiers": {},
"attributes": {
"id": 15,
"category": 15,
"knowledge_level": 15,
"agent_type": 15,
"has_confidence_score": 15,
"original_subject": 15,
"original_object": 15
},
"subject_id_prefixes": {
"CHEBI": 15
},
"object_id_prefixes": {
"CHEBI": 15
}
},
{
"subject_category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Drug"
],
"count": 3,
"primary_knowledge_sources": {
"infores:cohd": 3
},
"qualifiers": {},
"attributes": {
"id": 3,
"category": 3,
"knowledge_level": 3,
"agent_type": 3,
"has_confidence_score": 3,
"original_subject": 3,
"original_object": 3
},
"subject_id_prefixes": {
"CHEBI": 3
},
"object_id_prefixes": {
"UNII": 1,
"RXCUI": 1,
"CHEBI": 1
}
},
{
"subject_category": [
"biolink:Drug",
"biolink:SmallMolecule"
],
"predicate": "biolink:negatively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 2,
"primary_knowledge_sources": {
"infores:cohd": 2
},
"qualifiers": {},
"attributes": {
"id": 2,
"category": 2,
"knowledge_level": 2,
"agent_type": 2,
"has_confidence_score": 2,
"original_subject": 2,
"original_object": 2
},
"subject_id_prefixes": {
"CHEBI": 2
},
"object_id_prefixes": {
"MONDO": 2
}
},
{
"subject_category": [
"biolink:Drug"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 6,
"primary_knowledge_sources": {
"infores:cohd": 6
},
"qualifiers": {},
"attributes": {
"id": 6,
"category": 6,
"knowledge_level": 6,
"agent_type": 6,
"has_confidence_score": 6,
"original_subject": 6,
"original_object": 6
},
"subject_id_prefixes": {
"RXCUI": 3,
"CHEBI": 2,
"DRUGBANK": 1
},
"object_id_prefixes": {
"MONDO": 6
}
},
{
"subject_category": [
"biolink:SmallMolecule"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 2,
"primary_knowledge_sources": {
"infores:cohd": 2
},
"qualifiers": {},
"attributes": {
"id": 2,
"category": 2,
"knowledge_level": 2,
"agent_type": 2,
"has_confidence_score": 2,
"original_subject": 2,
"original_object": 2
},
"subject_id_prefixes": {
"CHEBI": 2
},
"object_id_prefixes": {
"MONDO": 2
}
},
{
"subject_category": [
"biolink:Disease"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 1,
"primary_knowledge_sources": {
"infores:cohd": 1
},
"qualifiers": {},
"attributes": {
"id": 1,
"category": 1,
"knowledge_level": 1,
"agent_type": 1,
"has_confidence_score": 1,
"original_subject": 1,
"original_object": 1
},
"subject_id_prefixes": {
"UMLS": 1
},
"object_id_prefixes": {
"UMLS": 1
}
},
{
"subject_category": [
"biolink:ChemicalEntity"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 2,
"primary_knowledge_sources": {
"infores:cohd": 2
},
"qualifiers": {},
"attributes": {
"id": 2,
"category": 2,
"knowledge_level": 2,
"agent_type": 2,
"has_confidence_score": 2,
"original_subject": 2,
"original_object": 2
},
"subject_id_prefixes": {
"CHEBI": 1,
"MESH": 1
},
"object_id_prefixes": {
"MONDO": 2
}
},
{
"subject_category": [
"biolink:MolecularMixture"
],
"predicate": "biolink:positively_correlated_with",
"object_category": [
"biolink:Disease"
],
"count": 1,
"primary_knowledge_sources": {
"infores:cohd": 1
},
"qualifiers": {},
"attributes": {
"id": 1,
"category": 1,
"knowledge_level": 1,
"agent_type": 1,
"has_confidence_score": 1,
"original_subject": 1,
"original_object": 1
},
"subject_id_prefixes": {
"UNII": 1
},
"object_id_prefixes": {
"MONDO": 1
}
}
],
"edges_summary": {
"total_count": 84,
"predicates": {
"biolink:positively_correlated_with": 82,
"biolink:negatively_correlated_with": 2
},
"primary_knowledge_sources": {
"infores:cohd": 84
},
"predicates_by_knowledge_source": {
"infores:cohd": {
"biolink:positively_correlated_with": 82,
"biolink:negatively_correlated_with": 2
}
},
"qualifiers": {},
"attributes": {
"id": 84,
"category": 84,
"knowledge_level": 84,
"agent_type": 84,
"has_confidence_score": 84,
"original_subject": 84,
"original_object": 84
}
}
}
}