{
  "@id": "https://stars.renci.org/var/translator/releases/hpoa/2025_11_13/",
  "@type": "sc:Dataset",
  "name": "hpoa",
  "description": "A knowledge graph built for the NCATS Biomedical Data Translator project using Translator-Ingests, Biolink Model, and Node Normalizer.",
  "license": "MIT",
  "url": "https://stars.renci.org/var/translator/releases/hpoa/2025_11_13/",
  "version": "2025_11_13",
  "dateCreated": "2025_11_13",
  "biolinkVersion": "4.3.4",
  "babelVersion": "2025sep1",
  "distribution": [
    {
      "@id": "hpoa.tar.xz",
      "@type": "cr:FileObject",
      "contentUrl": "hpoa.tar.xz",
      "encodingFormat": "application/x-xz",
      "description": "Compressed tar archive containing the KGX files: nodes.jsonl and edges.jsonl"
    }
  ],
  "isBasedOn": [
    {
      "id": "hpoa",
      "name": "Human Phenotype Ontology Annotations",
      "description": "The [Human Phenotype Ontology (HPO)](https://hpo.jax.org/) provides a standard vocabulary of phenotypic abnormalities encountered in human disease. Each term in the HPO describes a phenotypic abnormality, such as Atrial septal defect. The HPO is currently being developed using the medical literature, Orphanet, DECIPHER, and OMIM. HPO currently contains over 18,000 terms and over 156,000 annotations to hereditary diseases. The HPO project and others have developed software for phenotype-driven differential diagnostics, genomic diagnostics, and translational research.\nThe Human Phenotype Ontology group curates and assembles over 115,000 HPO-related annotations (\"HPOA\") to hereditary diseases using the HPO ontology. Here we create Biolink associations between diseases and phenotypic features, together with their evidence, and age of onset and frequency (if known). Disease annotations here are also cross-referenced to the MONarch Disease Ontology (MONDO) (https://mondo.monarchinitiative.org/).\nThere are four HPOA ingests ('disease-to-phenotype' (includes capture of disease modes of inheritance, 'gene-to-phenotype' and 'gene-to-disease') that parse out records from the HPO Phenotype Annotation File (http://purl.obolibrary.org/obo/hp/hpoa/phenotype.hpoa).",
      "license": {
        "terms_of_use_url": "https://hpo.jax.org/license",
        "terms_of_use_description": "Bespoke terms describing specific conditions for use of HPOA data. No formal license."
      },
      "url": [
        "https://hpo.jax.org/data/annotations"
      ],
      "version": "2025-10-22"
    }
  ],
  "schema": {
    "nodes": [
      {
        "category": [
          "biolink:Disease"
        ],
        "count": 12814,
        "id_prefixes": {
          "MONDO": 12338,
          "OMIM": 280,
          "orphanet": 166,
          "DOID": 22,
          "UMLS": 8
        },
        "attributes": {
          "name": 12814,
          "equivalent_identifiers": 12814,
          "information_content": 12393,
          "inheritance": 224
        }
      },
      {
        "category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 9424,
        "id_prefixes": {
          "HP": 9424
        },
        "attributes": {
          "name": 9424,
          "equivalent_identifiers": 9424,
          "information_content": 9424
        }
      },
      {
        "category": [
          "biolink:Gene"
        ],
        "count": 107,
        "id_prefixes": {
          "NCBIGene": 107
        },
        "attributes": {
          "name": 107,
          "equivalent_identifiers": 107,
          "information_content": 61
        }
      },
      {
        "category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "count": 5399,
        "id_prefixes": {
          "NCBIGene": 5399
        },
        "attributes": {
          "name": 5399,
          "equivalent_identifiers": 5399,
          "information_content": 5399,
          "inheritance": 1
        }
      }
    ],
    "nodes_summary": {
      "total_count": 27744,
      "id_prefixes": {
        "MONDO": 12338,
        "HP": 9424,
        "NCBIGene": 5506,
        "OMIM": 280,
        "orphanet": 166,
        "DOID": 22,
        "UMLS": 8
      },
      "attributes": {
        "name": 27744,
        "equivalent_identifiers": 27744,
        "information_content": 27277,
        "inheritance": 225
      }
    },
    "edges": [
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 86793,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 86793
        },
        "qualifiers": {
          "frequency_qualifier": 68411,
          "onset_qualifier": 1396,
          "sex_qualifier": 331
        },
        "attributes": {
          "id": 86793,
          "category": 86793,
          "negated": 86793,
          "publications": 86793,
          "has_evidence": 86793,
          "knowledge_level": 86793,
          "agent_type": 86793,
          "original_subject": 86793,
          "original_object": 86793,
          "has_quotient": 28040,
          "has_percentage": 28040,
          "has_count": 27985,
          "has_total": 27985
        },
        "subject_id_prefixes": {
          "MONDO": 84444,
          "orphanet": 1437,
          "OMIM": 680,
          "DOID": 232
        },
        "object_id_prefixes": {
          "MONDO": 86793
        }
      },
      {
        "subject_category": [
          "biolink:Disease"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 168397,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 168397
        },
        "qualifiers": {
          "frequency_qualifier": 134214,
          "onset_qualifier": 1640,
          "sex_qualifier": 250
        },
        "attributes": {
          "id": 168397,
          "category": 168397,
          "negated": 168397,
          "publications": 168397,
          "has_evidence": 168397,
          "knowledge_level": 168397,
          "agent_type": 168397,
          "original_subject": 168397,
          "original_object": 168397,
          "has_quotient": 56427,
          "has_percentage": 56427,
          "has_count": 56385,
          "has_total": 56385
        },
        "subject_id_prefixes": {
          "MONDO": 165524,
          "orphanet": 1944,
          "OMIM": 710,
          "DOID": 219
        },
        "object_id_prefixes": {
          "HP": 168397
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 2162,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 2162
        },
        "qualifiers": {
          "disease_context_qualifier": 2118,
          "frequency_qualifier": 1731,
          "onset_qualifier": 2
        },
        "attributes": {
          "id": 2162,
          "category": 2162,
          "publications": 2162,
          "knowledge_level": 2162,
          "agent_type": 2162,
          "original_subject": 2162,
          "original_object": 2162,
          "has_count": 483,
          "has_total": 483,
          "has_quotient": 483,
          "has_percentage": 483,
          "negated": 44,
          "has_evidence": 44
        },
        "subject_id_prefixes": {
          "NCBIGene": 2162
        },
        "object_id_prefixes": {
          "MONDO": 2159,
          "UMLS": 3
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 3891,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 3891
        },
        "qualifiers": {
          "disease_context_qualifier": 3859,
          "frequency_qualifier": 3114
        },
        "attributes": {
          "id": 3891,
          "category": 3891,
          "publications": 3891,
          "knowledge_level": 3891,
          "agent_type": 3891,
          "original_subject": 3891,
          "original_object": 3891,
          "has_quotient": 996,
          "has_percentage": 996,
          "has_count": 994,
          "has_total": 994,
          "negated": 32,
          "has_evidence": 32
        },
        "subject_id_prefixes": {
          "NCBIGene": 3891
        },
        "object_id_prefixes": {
          "HP": 3891
        }
      },
      {
        "subject_category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 116390,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 116390
        },
        "qualifiers": {
          "disease_context_qualifier": 116387,
          "frequency_qualifier": 97405
        },
        "attributes": {
          "id": 116390,
          "category": 116390,
          "publications": 116390,
          "knowledge_level": 116390,
          "agent_type": 116390,
          "original_subject": 116390,
          "original_object": 116390,
          "has_quotient": 34410,
          "has_percentage": 34410,
          "has_count": 34317,
          "has_total": 34317,
          "negated": 3,
          "has_evidence": 3
        },
        "subject_id_prefixes": {
          "NCBIGene": 116390
        },
        "object_id_prefixes": {
          "MONDO": 116280,
          "UMLS": 110
        }
      },
      {
        "subject_category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "predicate": "biolink:has_phenotype",
        "object_category": [
          "biolink:PhenotypicFeature"
        ],
        "count": 238716,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 238716
        },
        "qualifiers": {
          "disease_context_qualifier": 238714,
          "frequency_qualifier": 191763
        },
        "attributes": {
          "id": 238716,
          "category": 238716,
          "publications": 238716,
          "knowledge_level": 238716,
          "agent_type": 238716,
          "original_subject": 238716,
          "original_object": 238716,
          "has_quotient": 81446,
          "has_percentage": 81446,
          "has_count": 81399,
          "has_total": 81399,
          "negated": 2,
          "has_evidence": 2
        },
        "subject_id_prefixes": {
          "NCBIGene": 238716
        },
        "object_id_prefixes": {
          "HP": 238716
        }
      },
      {
        "subject_category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "predicate": "biolink:causes",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 7991,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 7991
        },
        "qualifiers": {},
        "attributes": {
          "id": 7991,
          "category": 7991,
          "knowledge_level": 7991,
          "agent_type": 7991,
          "original_subject": 7991,
          "original_object": 7991
        },
        "subject_id_prefixes": {
          "NCBIGene": 7991
        },
        "object_id_prefixes": {
          "MONDO": 7764,
          "OMIM": 203,
          "DOID": 24
        }
      },
      {
        "subject_category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "predicate": "biolink:contributes_to",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 572,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 572
        },
        "qualifiers": {},
        "attributes": {
          "id": 572,
          "category": 572,
          "knowledge_level": 572,
          "agent_type": 572,
          "original_subject": 572,
          "original_object": 572
        },
        "subject_id_prefixes": {
          "NCBIGene": 572
        },
        "object_id_prefixes": {
          "MONDO": 512,
          "OMIM": 55,
          "DOID": 5
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:causes",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 123,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 123
        },
        "qualifiers": {},
        "attributes": {
          "id": 123,
          "category": 123,
          "knowledge_level": 123,
          "agent_type": 123,
          "original_subject": 123,
          "original_object": 123
        },
        "subject_id_prefixes": {
          "NCBIGene": 123
        },
        "object_id_prefixes": {
          "MONDO": 120,
          "OMIM": 3
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:contributes_to",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 7,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 7
        },
        "qualifiers": {},
        "attributes": {
          "id": 7,
          "category": 7,
          "knowledge_level": 7,
          "agent_type": 7,
          "original_subject": 7,
          "original_object": 7
        },
        "subject_id_prefixes": {
          "NCBIGene": 7
        },
        "object_id_prefixes": {
          "MONDO": 6,
          "OMIM": 1
        }
      },
      {
        "subject_category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "predicate": "biolink:causes",
        "object_category": [
          "biolink:Gene"
        ],
        "count": 1,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 1
        },
        "qualifiers": {},
        "attributes": {
          "id": 1,
          "category": 1,
          "knowledge_level": 1,
          "agent_type": 1,
          "original_subject": 1,
          "original_object": 1
        },
        "subject_id_prefixes": {
          "NCBIGene": 1
        },
        "object_id_prefixes": {
          "NCBIGene": 1
        }
      },
      {
        "subject_category": [
          "biolink:Protein",
          "biolink:Gene"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 7958,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 7958
        },
        "qualifiers": {},
        "attributes": {
          "id": 7958,
          "category": 7958,
          "knowledge_level": 7958,
          "agent_type": 7958,
          "original_subject": 7958,
          "original_object": 7958
        },
        "subject_id_prefixes": {
          "NCBIGene": 7958
        },
        "object_id_prefixes": {
          "MONDO": 7535,
          "orphanet": 423
        }
      },
      {
        "subject_category": [
          "biolink:Gene"
        ],
        "predicate": "biolink:associated_with",
        "object_category": [
          "biolink:Disease"
        ],
        "count": 143,
        "primary_knowledge_sources": {
          "infores:hpo-annotations": 143
        },
        "qualifiers": {},
        "attributes": {
          "id": 143,
          "category": 143,
          "knowledge_level": 143,
          "agent_type": 143,
          "original_subject": 143,
          "original_object": 143
        },
        "subject_id_prefixes": {
          "NCBIGene": 143
        },
        "object_id_prefixes": {
          "MONDO": 137,
          "orphanet": 6
        }
      }
    ],
    "edges_summary": {
      "total_count": 633144,
      "predicates": {
        "biolink:has_phenotype": 616349,
        "biolink:causes": 8115,
        "biolink:associated_with": 8101,
        "biolink:contributes_to": 579
      },
      "primary_knowledge_sources": {
        "infores:hpo-annotations": 633144
      },
      "predicates_by_knowledge_source": {
        "infores:hpo-annotations": {
          "biolink:has_phenotype": 616349,
          "biolink:causes": 8115,
          "biolink:associated_with": 8101,
          "biolink:contributes_to": 579
        }
      },
      "qualifiers": {
        "frequency_qualifier": 496638,
        "disease_context_qualifier": 361078,
        "onset_qualifier": 3038,
        "sex_qualifier": 581
      },
      "attributes": {
        "id": 633144,
        "category": 633144,
        "knowledge_level": 633144,
        "agent_type": 633144,
        "original_subject": 633144,
        "original_object": 633144,
        "publications": 616349,
        "negated": 255271,
        "has_evidence": 255271,
        "has_quotient": 201802,
        "has_percentage": 201802,
        "has_count": 201563,
        "has_total": 201563
      }
    }
  }
}