{
"@id": "https://stars.renci.org/var/translator/releases/alliance/2026_01_05/",
"@type": "sc:Dataset",
"name": "alliance",
"description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
"license": "MIT",
"url": "https://stars.renci.org/var/translator/releases/alliance/2026_01_05/",
"version": "2026_01_05",
"dateCreated": "2026-01-05",
"biolinkVersion": "4.3.4",
"babelVersion": "2025sep1",
"distribution": [
{
"@id": "alliance.tar.xz",
"@type": "cr:FileObject",
"contentUrl": "alliance.tar.xz",
"encodingFormat": "application/x-xz",
"description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
}
],
"isBasedOn": [
{
"id": "alliance",
"name": "Alliance of Genome Resources (AGR) Reference Ingest Guide",
"description": "The Alliance of Genome Resources (AGR) is a consortium of model organism databases and the Gene Ontology Consortium that provides a unified view of gene function, biological processes, phenotypes, and disease associations across multiple model organisms. The AGR aggregates and harmonizes data from member databases including MGI (mouse), RGD (rat), SGD (yeast), WormBase (C. elegans), FlyBase (D. melanogaster), ZFIN (zebrafish), and Xenbase (X. laevis and X. tropicalis).",
"license": {
"terms_of_use_url": "https://www.alliancegenome.org/privacy-warranty-licensing",
"license_name": "CC0 1.0 Universal",
"license_url": "https://creativecommons.org/publicdomain/zero/1.0/"
},
"url": [
"All downloads: https://www.alliancegenome.org/downloads",
"FMS (File Management System): https://fms.alliancegenome.org/download/"
],
"version": "8.3.0"
}
],
"schema": {
"nodes": [
{
"category": [
"biolink:Gene",
"biolink:Protein"
],
"count": 14223,
"id_prefixes": {
"NCBIGene": 14223
},
"attributes": {
"name": 14223,
"equivalent_identifiers": 14223,
"information_content": 13236
}
},
{
"category": [
"biolink:PhenotypicFeature"
],
"count": 29,
"id_prefixes": {
"HP": 15,
"EFO": 14
},
"attributes": {
"name": 29,
"equivalent_identifiers": 29,
"information_content": 29
}
},
{
"category": [
"biolink:Gene"
],
"count": 667,
"id_prefixes": {
"NCBIGene": 565,
"MGI": 101,
"RGD": 1
},
"attributes": {
"name": 667,
"equivalent_identifiers": 667,
"information_content": 85
}
},
{
"category": [
"biolink:Disease"
],
"count": 4,
"id_prefixes": {
"MONDO": 3,
"EFO": 1
},
"attributes": {
"name": 4,
"equivalent_identifiers": 4,
"information_content": 4
}
},
{
"category": [
"biolink:AnatomicalEntity"
],
"count": 668,
"id_prefixes": {
"UBERON": 668
},
"attributes": {
"name": 668,
"equivalent_identifiers": 668,
"information_content": 668
}
},
{
"category": [
"biolink:CellularComponent"
],
"count": 566,
"id_prefixes": {
"GO": 566
},
"attributes": {
"name": 566,
"equivalent_identifiers": 566,
"information_content": 566
}
}
],
"nodes_summary": {
"total_count": 16157,
"id_prefixes": {
"NCBIGene": 14788,
"UBERON": 668,
"GO": 566,
"MGI": 101,
"HP": 15,
"EFO": 15,
"MONDO": 3,
"RGD": 1
},
"attributes": {
"name": 16157,
"equivalent_identifiers": 16157,
"information_content": 14588
}
},
"edges": [
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:PhenotypicFeature"
],
"count": 2889,
"primary_knowledge_sources": {
"infores:mgi": 2855,
"infores:rgd": 34
},
"qualifiers": {},
"attributes": {
"id": 2889,
"category": 2889,
"publications": 2889,
"aggregator_knowledge_source": 2889,
"knowledge_level": 2889,
"agent_type": 2889,
"original_subject": 2889,
"original_object": 2889
},
"subject_id_prefixes": {
"NCBIGene": 2889
},
"object_id_prefixes": {
"EFO": 1668,
"HP": 1221
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:PhenotypicFeature"
],
"count": 93,
"primary_knowledge_sources": {
"infores:mgi": 91,
"infores:rgd": 2
},
"qualifiers": {},
"attributes": {
"id": 93,
"category": 93,
"publications": 93,
"aggregator_knowledge_source": 93,
"knowledge_level": 93,
"agent_type": 93,
"original_subject": 93,
"original_object": 93
},
"subject_id_prefixes": {
"MGI": 54,
"NCBIGene": 39
},
"object_id_prefixes": {
"EFO": 50,
"HP": 43
}
},
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:Disease"
],
"count": 58,
"primary_knowledge_sources": {
"infores:mgi": 56,
"infores:rgd": 2
},
"qualifiers": {},
"attributes": {
"id": 58,
"category": 58,
"publications": 58,
"aggregator_knowledge_source": 58,
"knowledge_level": 58,
"agent_type": 58,
"original_subject": 58,
"original_object": 58
},
"subject_id_prefixes": {
"NCBIGene": 58
},
"object_id_prefixes": {
"MONDO": 57,
"EFO": 1
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:has_phenotype",
"object_category": [
"biolink:Disease"
],
"count": 4,
"primary_knowledge_sources": {
"infores:mgi": 4
},
"qualifiers": {},
"attributes": {
"id": 4,
"category": 4,
"publications": 4,
"aggregator_knowledge_source": 4,
"knowledge_level": 4,
"agent_type": 4,
"original_subject": 4,
"original_object": 4
},
"subject_id_prefixes": {
"MGI": 4
},
"object_id_prefixes": {
"MONDO": 4
}
},
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:AnatomicalEntity"
],
"count": 157519,
"primary_knowledge_sources": {
"infores:mgi": 157519
},
"qualifiers": {},
"attributes": {
"id": 157519,
"category": 157519,
"qualifiers": 157519,
"publications": 157519,
"aggregator_knowledge_source": 157519,
"knowledge_level": 157519,
"agent_type": 157519,
"original_subject": 157519,
"original_object": 157519
},
"subject_id_prefixes": {
"NCBIGene": 157519
},
"object_id_prefixes": {
"UBERON": 157519
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:AnatomicalEntity"
],
"count": 3475,
"primary_knowledge_sources": {
"infores:mgi": 3475
},
"qualifiers": {},
"attributes": {
"id": 3475,
"category": 3475,
"qualifiers": 3475,
"publications": 3475,
"aggregator_knowledge_source": 3475,
"knowledge_level": 3475,
"agent_type": 3475,
"original_subject": 3475,
"original_object": 3475
},
"subject_id_prefixes": {
"NCBIGene": 3209,
"MGI": 266
},
"object_id_prefixes": {
"UBERON": 3475
}
},
{
"subject_category": [
"biolink:Gene",
"biolink:Protein"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:CellularComponent"
],
"count": 6869,
"primary_knowledge_sources": {
"infores:rgd": 6869
},
"qualifiers": {},
"attributes": {
"id": 6869,
"category": 6869,
"qualifiers": 6869,
"publications": 6869,
"aggregator_knowledge_source": 6869,
"knowledge_level": 6869,
"agent_type": 6869,
"original_subject": 6869,
"original_object": 6869
},
"subject_id_prefixes": {
"NCBIGene": 6869
},
"object_id_prefixes": {
"GO": 6869
}
},
{
"subject_category": [
"biolink:Gene"
],
"predicate": "biolink:expressed_in",
"object_category": [
"biolink:CellularComponent"
],
"count": 103,
"primary_knowledge_sources": {
"infores:rgd": 103
},
"qualifiers": {},
"attributes": {
"id": 103,
"category": 103,
"qualifiers": 103,
"publications": 103,
"aggregator_knowledge_source": 103,
"knowledge_level": 103,
"agent_type": 103,
"original_subject": 103,
"original_object": 103
},
"subject_id_prefixes": {
"NCBIGene": 102,
"RGD": 1
},
"object_id_prefixes": {
"GO": 103
}
}
],
"edges_summary": {
"total_count": 171010,
"predicates": {
"biolink:expressed_in": 167966,
"biolink:has_phenotype": 3044
},
"primary_knowledge_sources": {
"infores:mgi": 164000,
"infores:rgd": 7010
},
"predicates_by_knowledge_source": {
"infores:mgi": {
"biolink:expressed_in": 160994,
"biolink:has_phenotype": 3006
},
"infores:rgd": {
"biolink:expressed_in": 6972,
"biolink:has_phenotype": 38
}
},
"qualifiers": {},
"attributes": {
"id": 171010,
"category": 171010,
"publications": 171010,
"aggregator_knowledge_source": 171010,
"knowledge_level": 171010,
"agent_type": 171010,
"original_subject": 171010,
"original_object": 171010,
"qualifiers": 167966
}
}
}
}