KGX STORAGE

graph-metadata.json
Back to Folder Download File
Size: 11.3 KB Modified: 2026-01-06 07:40:35
JSON Content
{
  "@id": "https://stars.renci.org/var/translator/releases/alliance/2026_01_05/",
  "@type": "sc:Dataset",
  "name": "alliance",
  "description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
  "license": "MIT",
  "url": "https://stars.renci.org/var/translator/releases/alliance/2026_01_05/",
  "version": "2026_01_05",
  "dateCreated": "2026_01_05",
  "biolinkVersion": "4.3.4",
  "babelVersion": "2025sep1",
  "distribution": [
    {
      "@id": "alliance.tar.xz",
      "@type": "cr:FileObject",
      "contentUrl": "alliance.tar.xz",
      "encodingFormat": "application/x-xz",
      "description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
    }
  ],
  "isBasedOn": [
    {
      "id": "alliance",
      "name": "Alliance of Genome Resources (AGR) Reference Ingest Guide",
      "description": "The Alliance of Genome Resources (AGR) is a consortium of model organism databases and the Gene Ontology Consortium that provides a unified view of gene function, biological processes, phenotypes, and disease associations across multiple model organisms. The AGR aggregates and harmonizes data from member databases including MGI (mouse), RGD (rat), SGD (yeast), WormBase (C. elegans), FlyBase (D. melanogaster), ZFIN (zebrafish), and Xenbase (X. laevis and X. tropicalis).",
      "license": {
        "terms_of_use_url": "https://www.alliancegenome.org/privacy-warranty-licensing",
        "license_name": "CC0 1.0 Universal",
        "license_url": "https://creativecommons.org/publicdomain/zero/1.0/"
      },
      "url": [
        "All downloads: https://www.alliancegenome.org/downloads",
        "FMS (File Management System): https://fms.alliancegenome.org/download/"
      ],
      "version": "8.3.0"
    }
  ],
  "schema": {
    "nodes": [
      {
        "category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "count": 14223,
        "id_prefixes": {
          "NCBIGene": 14223
        },
        "attributes": {
          "name": 14223,
          "equivalent_identifiers": 14223,
          "information_content": 13236
        }
      },
      {
        "category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 29,
        "id_prefixes": {
          "HP": 15,
          "EFO": 14
        },
        "attributes": {
          "name": 29,
          "equivalent_identifiers": 29,
          "information_content": 29
        }
      },
      {
        "category": [
          "biolink:Gene"
        ],
        "count": 667,
        "id_prefixes": {
          "NCBIGene": 565,
          "MGI": 101,
          "RGD": 1
        },
        "attributes": {
          "name": 667,
          "equivalent_identifiers": 667,
          "information_content": 85
        }
      },
      {
        "category": [
          "biolink:Disease"
        ],
        "count": 4,
        "id_prefixes": {
          "MONDO": 3,
          "EFO": 1
        },
        "attributes": {
          "name": 4,
          "equivalent_identifiers": 4,
          "information_content": 4
        }
      },
      {
        "category": [
          "biolink:AnatomicalEntity"
        ],
        "count": 668,
        "id_prefixes": {
          "UBERON": 668
        },
        "attributes": {
          "name": 668,
          "equivalent_identifiers": 668,
          "information_content": 668
        }
      },
      {
        "category": [
          "biolink:CellularComponent"
        ],
        "count": 566,
        "id_prefixes": {
          "GO": 566
        },
        "attributes": {
          "name": 566,
          "equivalent_identifiers": 566,
          "information_content": 566
        }
      }
    ],
    "nodes_summary": {
      "total_count": 16157,
      "id_prefixes": {
        "NCBIGene": 14788,
        "UBERON": 668,
        "GO": 566,
        "MGI": 101,
        "HP": 15,
        "EFO": 15,
        "MONDO": 3,
        "RGD": 1
      },
      "attributes": {
        "name": 16157,
        "equivalent_identifiers": 16157,
        "information_content": 14588
      }
    },
    "edges": [
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 2889,
        "primary_knowledge_sources": {
          "infores:mgi": 2855,
          "infores:rgd": 34
        },
        "qualifiers": {},
        "attributes": {
          "id": 2889,
          "category": 2889,
          "publications": 2889,
          "aggregator_knowledge_source": 2889,
          "knowledge_level": 2889,
          "agent_type": 2889,
          "original_subject": 2889,
          "original_object": 2889
        },
        "subject_id_prefixes": {
          "NCBIGene": 2889
        },
        "object_id_prefixes": {
          "EFO": 1668,
          "HP": 1221
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 93,
        "primary_knowledge_sources": {
          "infores:mgi": 91,
          "infores:rgd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 93,
          "category": 93,
          "publications": 93,
          "aggregator_knowledge_source": 93,
          "knowledge_level": 93,
          "agent_type": 93,
          "original_subject": 93,
          "original_object": 93
        },
        "subject_id_prefixes": {
          "MGI": 54,
          "NCBIGene": 39
        },
        "object_id_prefixes": {
          "EFO": 50,
          "HP": 43
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 58,
        "primary_knowledge_sources": {
          "infores:mgi": 56,
          "infores:rgd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 58,
          "category": 58,
          "publications": 58,
          "aggregator_knowledge_source": 58,
          "knowledge_level": 58,
          "agent_type": 58,
          "original_subject": 58,
          "original_object": 58
        },
        "subject_id_prefixes": {
          "NCBIGene": 58
        },
        "object_id_prefixes": {
          "MONDO": 57,
          "EFO": 1
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 4,
        "primary_knowledge_sources": {
          "infores:mgi": 4
        },
        "qualifiers": {},
        "attributes": {
          "id": 4,
          "category": 4,
          "publications": 4,
          "aggregator_knowledge_source": 4,
          "knowledge_level": 4,
          "agent_type": 4,
          "original_subject": 4,
          "original_object": 4
        },
        "subject_id_prefixes": {
          "MGI": 4
        },
        "object_id_prefixes": {
          "MONDO": 4
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:AnatomicalEntity"
        ],
        "count": 157519,
        "primary_knowledge_sources": {
          "infores:mgi": 157519
        },
        "qualifiers": {},
        "attributes": {
          "id": 157519,
          "category": 157519,
          "qualifiers": 157519,
          "publications": 157519,
          "aggregator_knowledge_source": 157519,
          "knowledge_level": 157519,
          "agent_type": 157519,
          "original_subject": 157519,
          "original_object": 157519
        },
        "subject_id_prefixes": {
          "NCBIGene": 157519
        },
        "object_id_prefixes": {
          "UBERON": 157519
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:AnatomicalEntity"
        ],
        "count": 3475,
        "primary_knowledge_sources": {
          "infores:mgi": 3475
        },
        "qualifiers": {},
        "attributes": {
          "id": 3475,
          "category": 3475,
          "qualifiers": 3475,
          "publications": 3475,
          "aggregator_knowledge_source": 3475,
          "knowledge_level": 3475,
          "agent_type": 3475,
          "original_subject": 3475,
          "original_object": 3475
        },
        "subject_id_prefixes": {
          "NCBIGene": 3209,
          "MGI": 266
        },
        "object_id_prefixes": {
          "UBERON": 3475
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:CellularComponent"
        ],
        "count": 6869,
        "primary_knowledge_sources": {
          "infores:rgd": 6869
        },
        "qualifiers": {},
        "attributes": {
          "id": 6869,
          "category": 6869,
          "qualifiers": 6869,
          "publications": 6869,
          "aggregator_knowledge_source": 6869,
          "knowledge_level": 6869,
          "agent_type": 6869,
          "original_subject": 6869,
          "original_object": 6869
        },
        "subject_id_prefixes": {
          "NCBIGene": 6869
        },
        "object_id_prefixes": {
          "GO": 6869
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:CellularComponent"
        ],
        "count": 103,
        "primary_knowledge_sources": {
          "infores:rgd": 103
        },
        "qualifiers": {},
        "attributes": {
          "id": 103,
          "category": 103,
          "qualifiers": 103,
          "publications": 103,
          "aggregator_knowledge_source": 103,
          "knowledge_level": 103,
          "agent_type": 103,
          "original_subject": 103,
          "original_object": 103
        },
        "subject_id_prefixes": {
          "NCBIGene": 102,
          "RGD": 1
        },
        "object_id_prefixes": {
          "GO": 103
        }
      }
    ],
    "edges_summary": {
      "total_count": 171010,
      "predicates": {
        "biolink:expressed_in": 167966,
        "biolink:has_phenotype": 3044
      },
      "primary_knowledge_sources": {
        "infores:mgi": 164000,
        "infores:rgd": 7010
      },
      "predicates_by_knowledge_source": {
        "infores:mgi": {
          "biolink:expressed_in": 160994,
          "biolink:has_phenotype": 3006
        },
        "infores:rgd": {
          "biolink:expressed_in": 6972,
          "biolink:has_phenotype": 38
        }
      },
      "qualifiers": {},
      "attributes": {
        "id": 171010,
        "category": 171010,
        "publications": 171010,
        "aggregator_knowledge_source": 171010,
        "knowledge_level": 171010,
        "agent_type": 171010,
        "original_subject": 171010,
        "original_object": 171010,
        "qualifiers": 167966
      }
    }
  }
}