{
  "@id": "https://kgx-storage.rtx.ai/releases/hpoa/2026_04_21/",
  "@type": "sc:Dataset",
  "name": "hpoa",
  "description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
  "license": "MIT",
  "url": "https://kgx-storage.rtx.ai/releases/hpoa/2026_04_21/",
  "version": "hpoa_2026-02-16_e80fcfa7_2025sep1_4.3.6",
  "dateCreated": "2026_04_21",
  "biolinkVersion": "4.3.6",
  "babelVersion": "2025sep1",
  "distribution": [
    {
      "@id": "hpoa.tar.xz",
      "@type": "cr:FileObject",
      "contentUrl": "hpoa.tar.xz",
      "encodingFormat": "application/x-xz",
      "description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
    }
  ],
  "isBasedOn": [
    {
      "id": "hpoa",
      "name": "Human Phenotype Ontology Annotations",
      "description": "The [Human Phenotype Ontology (HPO)](https://hpo.jax.org/) provides a  standard vocabulary of phenotypic abnormalities encountered in human disease. Each term in the HPO describes a phenotypic abnormality, such as Atrial septal defect.  The HPO is currently being developed using the medical literature, Orphanet, DECIPHER, and OMIM.  HPO currently contains over 18,000 terms and over 156,000 annotations to hereditary diseases.  The HPO project and others have developed software for phenotype-driven differential diagnostics, genomic diagnostics, and translational research.\nThe Human Phenotype Ontology group curates and assembles over 115,000 HPO-related annotations (\"HPOA\") to hereditary diseases using the HPO ontology. Here we create Biolink associations between diseases and phenotypic features, together with their evidence, and age of onset and frequency (if known). Disease annotations here are also cross-referenced to the MONarch Disease Ontology (MONDO) (https://mondo.monarchinitiative.org/).\nThere are four HPOA ingests ('disease-to-phenotype' (includes capture of disease modes of inheritance, 'gene-to-phenotype' and 'gene-to-disease') that parse out records from the  HPO Phenotype Annotation File (http://purl.obolibrary.org/obo/hp/hpoa/phenotype.hpoa).",
      "license": {
        "terms_of_use_url": "https://hpo.jax.org/license",
        "terms_of_use_description": "Bespoke terms describing specific conditions for use of HPOA data. No formal license."
      },
      "url": [
        "https://hpo.jax.org/data/annotations"
      ],
      "version": "2026-02-16"
    }
  ],
  "schema": {
    "nodes": [
      {
        "category": [
          "biolink:Disease"
        ],
        "count": 12262,
        "id_prefixes": {
          "MONDO": 11792,
          "OMIM": 331,
          "orphanet": 108,
          "DOID": 22,
          "UMLS": 9
        },
        "attributes": {
          "name": 12262,
          "equivalent_identifiers": 12262,
          "information_content": 11848,
          "description": 8274,
          "inheritance": 240
        }
      },
      {
        "category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 9553,
        "id_prefixes": {
          "HP": 9553
        },
        "attributes": {
          "name": 9553,
          "equivalent_identifiers": 9553,
          "information_content": 9553,
          "description": 8215
        }
      },
      {
        "category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "count": 5257,
        "id_prefixes": {
          "NCBIGene": 5257
        },
        "attributes": {
          "name": 5257,
          "equivalent_identifiers": 5257,
          "information_content": 5257,
          "description": 5257,
          "inheritance": 1
        }
      },
      {
        "category": [
          "biolink:Gene"
        ],
        "count": 101,
        "id_prefixes": {
          "NCBIGene": 101
        },
        "attributes": {
          "name": 101,
          "equivalent_identifiers": 101,
          "description": 89,
          "information_content": 60
        }
      }
    ],
    "nodes_summary": {
      "total_count": 27173,
      "id_prefixes": {
        "MONDO": 11792,
        "HP": 9553,
        "NCBIGene": 5358,
        "OMIM": 331,
        "orphanet": 108,
        "DOID": 22,
        "UMLS": 9
      },
      "attributes": {
        "name": 27173,
        "equivalent_identifiers": 27173,
        "information_content": 26718,
        "description": 21835,
        "inheritance": 241
      }
    },
    "edges": [
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 210690,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 210690
        },
        "qualifiers": {
          "qualified_predicate": 210690,
          "disease_context_qualifier": 210690,
          "subject_form_or_variant_qualifier": 210690,
          "frequency_qualifier": 174533
        },
        "attributes": {
          "id": 210690,
          "category": 210690,
          "publications": 210690,
          "knowledge_level": 210690,
          "agent_type": 210690,
          "original_subject": 210690,
          "original_object": 210690,
          "has_quotient": 66104,
          "has_percentage": 66104,
          "has_count": 66055,
          "has_total": 66055
        },
        "subject_id_prefixes": {
          "NCBIGene": 210690
        },
        "object_id_prefixes": {
          "HP": 210690
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 115504,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 115504
        },
        "qualifiers": {
          "qualified_predicate": 115504,
          "subject_form_or_variant_qualifier": 115504,
          "disease_context_qualifier": 108112,
          "frequency_qualifier": 91975
        },
        "attributes": {
          "id": 115504,
          "category": 115504,
          "knowledge_level": 115504,
          "agent_type": 115504,
          "original_subject": 115504,
          "original_object": 115504,
          "publications": 108112,
          "has_quotient": 29612,
          "has_percentage": 29612,
          "has_count": 29519,
          "has_total": 29519
        },
        "subject_id_prefixes": {
          "NCBIGene": 115504
        },
        "object_id_prefixes": {
          "MONDO": 115111,
          "OMIM": 256,
          "UMLS": 109,
          "DOID": 28
        }
      },
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 171041,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 171041
        },
        "qualifiers": {
          "frequency_qualifier": 136646,
          "onset_qualifier": 1645,
          "sex_qualifier": 256
        },
        "attributes": {
          "id": 171041,
          "category": 171041,
          "negated": 171041,
          "publications": 171041,
          "has_evidence_of_type": 171041,
          "knowledge_level": 171041,
          "agent_type": 171041,
          "original_subject": 171041,
          "original_object": 171041,
          "has_quotient": 60397,
          "has_percentage": 60397,
          "has_count": 60352,
          "has_total": 60352
        },
        "subject_id_prefixes": {
          "MONDO": 166894,
          "OMIM": 1970,
          "orphanet": 1959,
          "DOID": 218
        },
        "object_id_prefixes": {
          "HP": 171041
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 2290,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 2290
        },
        "qualifiers": {
          "qualified_predicate": 2290,
          "subject_form_or_variant_qualifier": 2290,
          "disease_context_qualifier": 2169,
          "frequency_qualifier": 1774
        },
        "attributes": {
          "id": 2290,
          "category": 2290,
          "knowledge_level": 2290,
          "agent_type": 2290,
          "original_subject": 2290,
          "original_object": 2290,
          "publications": 2169,
          "has_count": 535,
          "has_total": 535,
          "has_quotient": 535,
          "has_percentage": 535
        },
        "subject_id_prefixes": {
          "NCBIGene": 2290
        },
        "object_id_prefixes": {
          "MONDO": 2281,
          "UMLS": 5,
          "OMIM": 4
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 3941,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 3941
        },
        "qualifiers": {
          "qualified_predicate": 3941,
          "disease_context_qualifier": 3941,
          "subject_form_or_variant_qualifier": 3941,
          "frequency_qualifier": 3251
        },
        "attributes": {
          "id": 3941,
          "category": 3941,
          "publications": 3941,
          "knowledge_level": 3941,
          "agent_type": 3941,
          "original_subject": 3941,
          "original_object": 3941,
          "has_quotient": 1143,
          "has_percentage": 1143,
          "has_count": 1141,
          "has_total": 1141
        },
        "subject_id_prefixes": {
          "NCBIGene": 3941
        },
        "object_id_prefixes": {
          "HP": 3941
        }
      },
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 87037,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 87037
        },
        "qualifiers": {
          "frequency_qualifier": 68616,
          "onset_qualifier": 1394,
          "sex_qualifier": 331
        },
        "attributes": {
          "id": 87037,
          "category": 87037,
          "negated": 87037,
          "publications": 87037,
          "has_evidence_of_type": 87037,
          "knowledge_level": 87037,
          "agent_type": 87037,
          "original_subject": 87037,
          "original_object": 87037,
          "has_quotient": 29560,
          "has_percentage": 29560,
          "has_count": 29506,
          "has_total": 29506
        },
        "subject_id_prefixes": {
          "MONDO": 84052,
          "orphanet": 1441,
          "OMIM": 1312,
          "DOID": 232
        },
        "object_id_prefixes": {
          "MONDO": 87037
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 32,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 32
        },
        "qualifiers": {
          "frequency_qualifier": 8
        },
        "attributes": {
          "id": 32,
          "category": 32,
          "negated": 32,
          "publications": 32,
          "has_evidence_of_type": 32,
          "knowledge_level": 32,
          "agent_type": 32,
          "original_subject": 32,
          "original_object": 32,
          "has_count": 8,
          "has_total": 8,
          "has_quotient": 8,
          "has_percentage": 8
        },
        "subject_id_prefixes": {
          "NCBIGene": 32
        },
        "object_id_prefixes": {
          "HP": 32
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 44,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 44
        },
        "qualifiers": {
          "frequency_qualifier": 24,
          "onset_qualifier": 2
        },
        "attributes": {
          "id": 44,
          "category": 44,
          "negated": 44,
          "publications": 44,
          "has_evidence_of_type": 44,
          "knowledge_level": 44,
          "agent_type": 44,
          "original_subject": 44,
          "original_object": 44,
          "has_count": 24,
          "has_total": 24,
          "has_quotient": 24,
          "has_percentage": 24
        },
        "subject_id_prefixes": {
          "NCBIGene": 44
        },
        "object_id_prefixes": {
          "MONDO": 44
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 3,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 3
        },
        "qualifiers": {},
        "attributes": {
          "id": 3,
          "category": 3,
          "negated": 3,
          "publications": 3,
          "has_evidence_of_type": 3,
          "knowledge_level": 3,
          "agent_type": 3,
          "original_subject": 3,
          "original_object": 3
        },
        "subject_id_prefixes": {
          "NCBIGene": 3
        },
        "object_id_prefixes": {
          "MONDO": 3
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 5,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 5
        },
        "qualifiers": {},
        "attributes": {
          "id": 5,
          "category": 5,
          "negated": 5,
          "publications": 5,
          "has_evidence_of_type": 5,
          "knowledge_level": 5,
          "agent_type": 5,
          "original_subject": 5,
          "original_object": 5
        },
        "subject_id_prefixes": {
          "NCBIGene": 5
        },
        "object_id_prefixes": {
          "HP": 5
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:Gene"
        ],
        "count": 1,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 1
        },
        "qualifiers": {
          "subject_form_or_variant_qualifier": 1,
          "qualified_predicate": 1
        },
        "attributes": {
          "id": 1,
          "category": 1,
          "knowledge_level": 1,
          "agent_type": 1,
          "original_subject": 1,
          "original_object": 1
        },
        "subject_id_prefixes": {
          "NCBIGene": 1
        },
        "object_id_prefixes": {
          "NCBIGene": 1
        }
      }
    ],
    "edges_summary": {
      "total_count": 590588,
      "predicates": {
        "biolink:associated_with": 332426,
        "biolink:has_phenotype": 258162
      },
      "primary_knowledge_sources": {
        "infores:hpo-annotations": 590588
      },
      "predicates_by_knowledge_source": {
        "infores:hpo-annotations": {
          "biolink:associated_with": 332426,
          "biolink:has_phenotype": 258162
        }
      },
      "qualifiers": {
        "frequency_qualifier": 476827,
        "qualified_predicate": 332426,
        "subject_form_or_variant_qualifier": 332426,
        "disease_context_qualifier": 324912,
        "onset_qualifier": 3041,
        "sex_qualifier": 587
      },
      "attributes": {
        "id": 590588,
        "category": 590588,
        "knowledge_level": 590588,
        "agent_type": 590588,
        "original_subject": 590588,
        "original_object": 590588,
        "publications": 583074,
        "negated": 258162,
        "has_evidence_of_type": 258162,
        "has_quotient": 187383,
        "has_percentage": 187383,
        "has_count": 187140,
        "has_total": 187140
      }
    }
  }
}