KGX STORAGE

graph-metadata.json
Back to Folder Download File
Size: 11.3 KB Modified: 2026-01-03 03:26:24
JSON Content
{
  "@id": "https://stars.renci.org/var/translator/releases/alliance/2025_12_09/",
  "@type": "sc:Dataset",
  "name": "alliance",
  "description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
  "license": "MIT",
  "url": "https://stars.renci.org/var/translator/releases/alliance/2025_12_09/",
  "version": "2025_12_09",
  "dateCreated": "2025_12_09",
  "biolinkVersion": "4.3.5",
  "babelVersion": "2025sep1",
  "distribution": [
    {
      "@id": "alliance.tar.xz",
      "@type": "cr:FileObject",
      "contentUrl": "alliance.tar.xz",
      "encodingFormat": "application/x-xz",
      "description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
    }
  ],
  "isBasedOn": [
    {
      "id": "alliance",
      "name": "Alliance of Genome Resources (AGR) Reference Ingest Guide",
      "description": "The Alliance of Genome Resources (AGR) is a consortium of model organism databases and the Gene Ontology Consortium that provides a unified view of gene function, biological processes, phenotypes, and disease associations across multiple model organisms. The AGR aggregates and harmonizes data from member databases including MGI (mouse), RGD (rat), SGD (yeast), WormBase (C. elegans), FlyBase (D. melanogaster), ZFIN (zebrafish), and Xenbase (X. laevis and X. tropicalis).",
      "license": {
        "terms_of_use_url": "https://www.alliancegenome.org/privacy-warranty-licensing",
        "license_name": "CC0 1.0 Universal",
        "license_url": "https://creativecommons.org/publicdomain/zero/1.0/"
      },
      "url": [
        "All downloads: https://www.alliancegenome.org/downloads",
        "FMS (File Management System): https://fms.alliancegenome.org/download/"
      ],
      "version": "8.2.0"
    }
  ],
  "schema": {
    "nodes": [
      {
        "category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "count": 14148,
        "id_prefixes": {
          "NCBIGene": 14148
        },
        "attributes": {
          "name": 14148,
          "equivalent_identifiers": 14148,
          "information_content": 13172
        }
      },
      {
        "category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 29,
        "id_prefixes": {
          "HP": 15,
          "EFO": 14
        },
        "attributes": {
          "name": 29,
          "equivalent_identifiers": 29,
          "information_content": 29
        }
      },
      {
        "category": [
          "biolink:Gene"
        ],
        "count": 655,
        "id_prefixes": {
          "NCBIGene": 554,
          "MGI": 100,
          "RGD": 1
        },
        "attributes": {
          "name": 655,
          "equivalent_identifiers": 655,
          "information_content": 83
        }
      },
      {
        "category": [
          "biolink:Disease"
        ],
        "count": 4,
        "id_prefixes": {
          "MONDO": 3,
          "EFO": 1
        },
        "attributes": {
          "name": 4,
          "equivalent_identifiers": 4,
          "information_content": 4
        }
      },
      {
        "category": [
          "biolink:AnatomicalEntity"
        ],
        "count": 664,
        "id_prefixes": {
          "UBERON": 664
        },
        "attributes": {
          "name": 664,
          "equivalent_identifiers": 664,
          "information_content": 664
        }
      },
      {
        "category": [
          "biolink:CellularComponent"
        ],
        "count": 562,
        "id_prefixes": {
          "GO": 562
        },
        "attributes": {
          "name": 562,
          "equivalent_identifiers": 562,
          "information_content": 562
        }
      }
    ],
    "nodes_summary": {
      "total_count": 16062,
      "id_prefixes": {
        "NCBIGene": 14702,
        "UBERON": 664,
        "GO": 562,
        "MGI": 100,
        "HP": 15,
        "EFO": 15,
        "MONDO": 3,
        "RGD": 1
      },
      "attributes": {
        "name": 16062,
        "equivalent_identifiers": 16062,
        "information_content": 14514
      }
    },
    "edges": [
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 2855,
        "primary_knowledge_sources": {
          "infores:mgi": 2821,
          "infores:rgd": 34
        },
        "qualifiers": {},
        "attributes": {
          "id": 2855,
          "category": 2855,
          "publications": 2855,
          "aggregator_knowledge_source": 2855,
          "knowledge_level": 2855,
          "agent_type": 2855,
          "original_subject": 2855,
          "original_object": 2855
        },
        "subject_id_prefixes": {
          "NCBIGene": 2855
        },
        "object_id_prefixes": {
          "EFO": 1655,
          "HP": 1200
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 90,
        "primary_knowledge_sources": {
          "infores:mgi": 88,
          "infores:rgd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 90,
          "category": 90,
          "publications": 90,
          "aggregator_knowledge_source": 90,
          "knowledge_level": 90,
          "agent_type": 90,
          "original_subject": 90,
          "original_object": 90
        },
        "subject_id_prefixes": {
          "MGI": 53,
          "NCBIGene": 37
        },
        "object_id_prefixes": {
          "EFO": 47,
          "HP": 43
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 58,
        "primary_knowledge_sources": {
          "infores:mgi": 56,
          "infores:rgd": 2
        },
        "qualifiers": {},
        "attributes": {
          "id": 58,
          "category": 58,
          "publications": 58,
          "aggregator_knowledge_source": 58,
          "knowledge_level": 58,
          "agent_type": 58,
          "original_subject": 58,
          "original_object": 58
        },
        "subject_id_prefixes": {
          "NCBIGene": 58
        },
        "object_id_prefixes": {
          "MONDO": 57,
          "EFO": 1
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 4,
        "primary_knowledge_sources": {
          "infores:mgi": 4
        },
        "qualifiers": {},
        "attributes": {
          "id": 4,
          "category": 4,
          "publications": 4,
          "aggregator_knowledge_source": 4,
          "knowledge_level": 4,
          "agent_type": 4,
          "original_subject": 4,
          "original_object": 4
        },
        "subject_id_prefixes": {
          "MGI": 4
        },
        "object_id_prefixes": {
          "MONDO": 4
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:AnatomicalEntity"
        ],
        "count": 153915,
        "primary_knowledge_sources": {
          "infores:mgi": 153915
        },
        "qualifiers": {},
        "attributes": {
          "id": 153915,
          "category": 153915,
          "qualifiers": 153915,
          "publications": 153915,
          "aggregator_knowledge_source": 153915,
          "knowledge_level": 153915,
          "agent_type": 153915,
          "original_subject": 153915,
          "original_object": 153915
        },
        "subject_id_prefixes": {
          "NCBIGene": 153915
        },
        "object_id_prefixes": {
          "UBERON": 153915
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:AnatomicalEntity"
        ],
        "count": 3395,
        "primary_knowledge_sources": {
          "infores:mgi": 3395
        },
        "qualifiers": {},
        "attributes": {
          "id": 3395,
          "category": 3395,
          "qualifiers": 3395,
          "publications": 3395,
          "aggregator_knowledge_source": 3395,
          "knowledge_level": 3395,
          "agent_type": 3395,
          "original_subject": 3395,
          "original_object": 3395
        },
        "subject_id_prefixes": {
          "NCBIGene": 3148,
          "MGI": 247
        },
        "object_id_prefixes": {
          "UBERON": 3395
        }
      },
      {
        "subject_category": [
          "biolink:Gene",
          "biolink:Protein"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:CellularComponent"
        ],
        "count": 6712,
        "primary_knowledge_sources": {
          "infores:rgd": 6712
        },
        "qualifiers": {},
        "attributes": {
          "id": 6712,
          "category": 6712,
          "qualifiers": 6712,
          "publications": 6712,
          "aggregator_knowledge_source": 6712,
          "knowledge_level": 6712,
          "agent_type": 6712,
          "original_subject": 6712,
          "original_object": 6712
        },
        "subject_id_prefixes": {
          "NCBIGene": 6712
        },
        "object_id_prefixes": {
          "GO": 6712
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:expressed_in",
        "object_category": [
          "biolink:CellularComponent"
        ],
        "count": 98,
        "primary_knowledge_sources": {
          "infores:rgd": 98
        },
        "qualifiers": {},
        "attributes": {
          "id": 98,
          "category": 98,
          "qualifiers": 98,
          "publications": 98,
          "aggregator_knowledge_source": 98,
          "knowledge_level": 98,
          "agent_type": 98,
          "original_subject": 98,
          "original_object": 98
        },
        "subject_id_prefixes": {
          "NCBIGene": 97,
          "RGD": 1
        },
        "object_id_prefixes": {
          "GO": 98
        }
      }
    ],
    "edges_summary": {
      "total_count": 167127,
      "predicates": {
        "biolink:expressed_in": 164120,
        "biolink:has_phenotype": 3007
      },
      "primary_knowledge_sources": {
        "infores:mgi": 160279,
        "infores:rgd": 6848
      },
      "predicates_by_knowledge_source": {
        "infores:mgi": {
          "biolink:expressed_in": 157310,
          "biolink:has_phenotype": 2969
        },
        "infores:rgd": {
          "biolink:expressed_in": 6810,
          "biolink:has_phenotype": 38
        }
      },
      "qualifiers": {},
      "attributes": {
        "id": 167127,
        "category": 167127,
        "publications": 167127,
        "aggregator_knowledge_source": 167127,
        "knowledge_level": 167127,
        "agent_type": 167127,
        "original_subject": 167127,
        "original_object": 167127,
        "qualifiers": 164120
      }
    }
  }
}