{
"@id": "https://stars.renci.org/var/translator/releases/alliance/2025_12_09/",
"@type": "sc:Dataset",
"name": "alliance",
"description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
"license": "MIT",
"url": "https://stars.renci.org/var/translator/releases/alliance/2025_12_09/",
"version": "2025_12_09",
"dateCreated": "2025-12-09",
"biolinkVersion": "4.3.5",
"babelVersion": "2025sep1",
"distribution": [
{
"@id": "alliance.tar.xz",
"@type": "cr:FileObject",
"contentUrl": "alliance.tar.xz",
"encodingFormat": "application/x-xz",
"description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
}
],
"isBasedOn": [
{
"id": "alliance",
"name": "Alliance of Genome Resources (AGR) Reference Ingest Guide",
"description": "The Alliance of Genome Resources (AGR) is a consortium of model organism databases and the Gene Ontology Consortium that provides a unified view of gene function, biological processes, phenotypes, and disease associations across multiple model organisms. The AGR aggregates and harmonizes data from member databases including MGI (mouse), RGD (rat), SGD (yeast), WormBase (C. elegans), FlyBase (D. melanogaster), ZFIN (zebrafish), and Xenbase (X. laevis and X. tropicalis).",
"license": {
"terms_of_use_url": "https://www.alliancegenome.org/privacy-warranty-licensing",
"license_name": "CC0 1.0 Universal",
"license_url": "https://creativecommons.org/publicdomain/zero/1.0/"
},
"url": [
"All downloads: https://www.alliancegenome.org/downloads",
"FMS (File Management System): https://fms.alliancegenome.org/download/"
],
"version": "8.2.0"
}
],
"schema": {
"nodes": [
{
"category": [
"biolink:Gene",
"biolink:Protein"
],
"count": 14148,
"id_prefixes": {
"NCBIGene": 14148
},
"attributes": {
"name": 14148,
"equivalent_identifiers": 14148,
"information_content": 13172
}
},
{
"category": [
"biolink:PhenotypicFeature"
],
"count": 29,
"id_prefixes": {
"HP": 15,
"EFO": 14
},
"attributes": {
"name": 29,
"equivalent_identifiers": 29,
"information_content": 29
}
},
{
"category": [
"biolink:Gene"
],
"count": 655,
"id_prefixes": {
"NCBIGene": 554,
"MGI": 100,
"RGD": 1
},
"attributes": {
"name": 655,
"equivalent_identifiers": 655,
"information_content": 83
}
},
{
"category": [
"biolink:Disease"
],
"count": 4,
"id_prefixes": {
"MONDO": 3,
"EFO": 1
},
"attributes": {
"name": 4,
"equivalent_identifiers": 4,
"information_content": 4
}
},
{
"category": [
"biolink:AnatomicalEntity"
],
"count": 664,
"id_prefixes": {
"UBERON": 664
},
"attributes": {
"name": 664,
"equivalent_identifiers": 664,
"information_content": 664
}
},
{
"category": [
"biolink:CellularComponent"
],
"count": 562,
"id_prefixes": {
"GO": 562
},
"attributes": {
"name": 562,
"equivalent_identifiers": 562,
"information_content": 562
}
}
],
"nodes_summary": {
"total_count": 16062,
"id_prefixes": {
"NCBIGene": 14702,
"UBERON": 664,
"GO": 562,
"MGI": 100,
"HP": 15,
"EFO": 15,
"MONDO": 3,
"RGD": 1
},
"attributes": {
"name": 16062,
"equivalent_identifiers": 16062,
"information_content": 14514
}
},
"edges": [
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:PhenotypicFeature"
],
"count": 2855,
"primary_knowledge_sources": {
"infores:mgi": 2821,
"infores:rgd": 34
},
"qualifiers": {},
"attributes": {
"id": 2855,
"category": 2855,
"publications": 2855,
"aggregator_knowledge_source": 2855,
"knowledge_level": 2855,
"agent_type": 2855,
"original_subject": 2855,
"original_object": 2855
},
"subject_id_prefixes": {
"NCBIGene": 2855
},
"object_id_prefixes": {
"EFO": 1655,
"HP": 1200
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:PhenotypicFeature"
],
"count": 90,
"primary_knowledge_sources": {
"infores:mgi": 88,
"infores:rgd": 2
},
"qualifiers": {},
"attributes": {
"id": 90,
"category": 90,
"publications": 90,
"aggregator_knowledge_source": 90,
"knowledge_level": 90,
"agent_type": 90,
"original_subject": 90,
"original_object": 90
},
"subject_id_prefixes": {
"MGI": 53,
"NCBIGene": 37
},
"object_id_prefixes": {
"EFO": 47,
"HP": 43
}
},
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:Disease"
],
"count": 58,
"primary_knowledge_sources": {
"infores:mgi": 56,
"infores:rgd": 2
},
"qualifiers": {},
"attributes": {
"id": 58,
"category": 58,
"publications": 58,
"aggregator_knowledge_source": 58,
"knowledge_level": 58,
"agent_type": 58,
"original_subject": 58,
"original_object": 58
},
"subject_id_prefixes": {
"NCBIGene": 58
},
"object_id_prefixes": {
"MONDO": 57,
"EFO": 1
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:Disease"
],
"count": 4,
"primary_knowledge_sources": {
"infores:mgi": 4
},
"qualifiers": {},
"attributes": {
"id": 4,
"category": 4,
"publications": 4,
"aggregator_knowledge_source": 4,
"knowledge_level": 4,
"agent_type": 4,
"original_subject": 4,
"original_object": 4
},
"subject_id_prefixes": {
"MGI": 4
},
"object_id_prefixes": {
"MONDO": 4
}
},
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:AnatomicalEntity"
],
"count": 153915,
"primary_knowledge_sources": {
"infores:mgi": 153915
},
"qualifiers": {},
"attributes": {
"id": 153915,
"category": 153915,
"qualifiers": 153915,
"publications": 153915,
"aggregator_knowledge_source": 153915,
"knowledge_level": 153915,
"agent_type": 153915,
"original_subject": 153915,
"original_object": 153915
},
"subject_id_prefixes": {
"NCBIGene": 153915
},
"object_id_prefixes": {
"UBERON": 153915
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:AnatomicalEntity"
],
"count": 3395,
"primary_knowledge_sources": {
"infores:mgi": 3395
},
"qualifiers": {},
"attributes": {
"id": 3395,
"category": 3395,
"qualifiers": 3395,
"publications": 3395,
"aggregator_knowledge_source": 3395,
"knowledge_level": 3395,
"agent_type": 3395,
"original_subject": 3395,
"original_object": 3395
},
"subject_id_prefixes": {
"NCBIGene": 3148,
"MGI": 247
},
"object_id_prefixes": {
"UBERON": 3395
}
},
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:CellularComponent"
],
"count": 6712,
"primary_knowledge_sources": {
"infores:rgd": 6712
},
"qualifiers": {},
"attributes": {
"id": 6712,
"category": 6712,
"qualifiers": 6712,
"publications": 6712,
"aggregator_knowledge_source": 6712,
"knowledge_level": 6712,
"agent_type": 6712,
"original_subject": 6712,
"original_object": 6712
},
"subject_id_prefixes": {
"NCBIGene": 6712
},
"object_id_prefixes": {
"GO": 6712
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:CellularComponent"
],
"count": 98,
"primary_knowledge_sources": {
"infores:rgd": 98
},
"qualifiers": {},
"attributes": {
"id": 98,
"category": 98,
"qualifiers": 98,
"publications": 98,
"aggregator_knowledge_source": 98,
"knowledge_level": 98,
"agent_type": 98,
"original_subject": 98,
"original_object": 98
},
"subject_id_prefixes": {
"NCBIGene": 97,
"RGD": 1
},
"object_id_prefixes": {
"GO": 98
}
}
],
"edges_summary": {
"total_count": 167127,
"predicates": {
"biolink:expressed_in": 164120,
"biolink:has_phenotype": 3007
},
"primary_knowledge_sources": {
"infores:mgi": 160279,
"infores:rgd": 6848
},
"predicates_by_knowledge_source": {
"infores:mgi": {
"biolink:expressed_in": 157310,
"biolink:has_phenotype": 2969
},
"infores:rgd": {
"biolink:expressed_in": 6810,
"biolink:has_phenotype": 38
}
},
"qualifiers": {},
"attributes": {
"id": 167127,
"category": 167127,
"publications": 167127,
"aggregator_knowledge_source": 167127,
"knowledge_level": 167127,
"agent_type": 167127,
"original_subject": 167127,
"original_object": 167127,
"qualifiers": 164120
}
}
}
}