Closed saramsey closed 1 year ago
From this Cypher query (run against the KG2.7.4pre Neo4j server):
match (n)-[r:`biolink:biomarker_for` {original_predicate: 'SEMMEDDB:diagnoses'}]->(m) return distinct n.category, m.category, count(*) as c order by c desc;
we get the following results (note that your browser window may need to be wide in order to see the numeric column on the right):
n.category | m.category | c |
---|---|---|
"biolink:Procedure" | "biolink:Disease" | 177684 |
"biolink:Procedure" | "biolink:DiseaseOrPhenotypicFeature" | 28042 |
"biolink:Cohort" | "biolink:Disease" | 20671 |
"biolink:Procedure" | "biolink:NamedThing" | 8934 |
"biolink:NamedThing" | "biolink:Disease" | 7347 |
"biolink:Procedure" | "biolink:OrganismTaxon" | 7049 |
"biolink:Procedure" | "biolink:PhenotypicFeature" | 3665 |
"biolink:Activity" | "biolink:Disease" | 2230 |
"biolink:PhenotypicFeature" | "biolink:Disease" | 1715 |
"biolink:Cohort" | "biolink:PhenotypicFeature" | 1510 |
"biolink:Procedure" | "biolink:BiologicalEntity" | 1171 |
"biolink:NamedThing" | "biolink:DiseaseOrPhenotypicFeature" | 1072 |
"biolink:Procedure" | "biolink:InformationContentEntity" | 1043 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:Disease" | 861 |
"biolink:Device" | "biolink:OrganismTaxon" | 779 |
"biolink:InformationContentEntity" | "biolink:Disease" | 642 |
"biolink:Cohort" | "biolink:DiseaseOrPhenotypicFeature" | 637 |
"biolink:Cohort" | "biolink:NamedThing" | 570 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:Disease" | 564 |
"biolink:Phenomenon" | "biolink:Disease" | 548 |
"biolink:Publication" | "biolink:Disease" | 485 |
"biolink:Activity" | "biolink:DiseaseOrPhenotypicFeature" | 426 |
"biolink:PhysiologicalProcess" | "biolink:Disease" | 406 |
"biolink:Procedure" | "biolink:Phenomenon" | 362 |
"biolink:Procedure" | "biolink:PhysiologicalProcess" | 333 |
"biolink:Agent" | "biolink:Disease" | 288 |
"biolink:NamedThing" | "biolink:NamedThing" | 268 |
"biolink:NamedThing" | "biolink:OrganismTaxon" | 257 |
"biolink:Disease" | "biolink:Disease" | 226 |
"biolink:NamedThing" | "biolink:PhenotypicFeature" | 202 |
"biolink:Procedure" | "biolink:Procedure" | 201 |
"biolink:Activity" | "biolink:NamedThing" | 115 |
"biolink:Procedure" | "biolink:Activity" | 107 |
"biolink:Publication" | "biolink:DiseaseOrPhenotypicFeature" | 106 |
"biolink:Procedure" | "biolink:Behavior" | 105 |
"biolink:Phenomenon" | "biolink:DiseaseOrPhenotypicFeature" | 94 |
"biolink:InformationContentEntity" | "biolink:DiseaseOrPhenotypicFeature" | 93 |
"biolink:PhysicalEntity" | "biolink:OrganismTaxon" | 90 |
"biolink:PhysiologicalProcess" | "biolink:DiseaseOrPhenotypicFeature" | 83 |
"biolink:PhysiologicalProcess" | "biolink:OrganismTaxon" | 78 |
"biolink:Procedure" | "biolink:PopulationOfIndividualOrganisms" | 71 |
"biolink:Activity" | "biolink:PhenotypicFeature" | 69 |
"biolink:Publication" | "biolink:PhenotypicFeature" | 69 |
"biolink:PhenotypicFeature" | "biolink:NamedThing" | 69 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:PhenotypicFeature" | 63 |
"biolink:Cohort" | "biolink:BiologicalEntity" | 54 |
"biolink:Cohort" | "biolink:Behavior" | 53 |
"biolink:Procedure" | "biolink:AnatomicalEntity" | 52 |
"biolink:Device" | "biolink:Disease" | 51 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:DiseaseOrPhenotypicFeature" | 50 |
"biolink:NamedThing" | "biolink:BiologicalEntity" | 49 |
"biolink:InformationContentEntity" | "biolink:PhenotypicFeature" | 49 |
"biolink:NamedThing" | "biolink:InformationContentEntity" | 45 |
"biolink:Activity" | "biolink:OrganismTaxon" | 42 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:DiseaseOrPhenotypicFeature" | 36 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:NamedThing" | 35 |
"biolink:Procedure" | "biolink:GrossAnatomicalStructure" | 32 |
"biolink:PhysiologicalProcess" | "biolink:NamedThing" | 32 |
"biolink:ChemicalEntity" | "biolink:Disease" | 31 |
"biolink:InformationContentEntity" | "biolink:NamedThing" | 31 |
"biolink:Procedure" | "biolink:CellularComponent" | 30 |
"biolink:Procedure" | "biolink:Cohort" | 29 |
"biolink:Procedure" | "biolink:ChemicalEntity" | 28 |
"biolink:PhysiologicalProcess" | "biolink:PhenotypicFeature" | 27 |
"biolink:Publication" | "biolink:NamedThing" | 27 |
"biolink:Cohort" | "biolink:InformationContentEntity" | 27 |
"biolink:Procedure" | "biolink:Publication" | 26 |
"biolink:InformationContentEntity" | "biolink:OrganismTaxon" | 25 |
"biolink:Activity" | "biolink:InformationContentEntity" | 24 |
"biolink:Phenomenon" | "biolink:PhenotypicFeature" | 22 |
"biolink:Procedure" | "biolink:IndividualOrganism" | 22 |
"biolink:NamedThing" | "biolink:PhysiologicalProcess" | 21 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:NamedThing" | 21 |
"biolink:Phenomenon" | "biolink:NamedThing" | 21 |
"biolink:PhenotypicFeature" | "biolink:DiseaseOrPhenotypicFeature" | 20 |
"biolink:Activity" | "biolink:BiologicalEntity" | 18 |
"biolink:Cohort" | "biolink:PhysiologicalProcess" | 15 |
"biolink:Agent" | "biolink:PhenotypicFeature" | 15 |
"biolink:Phenomenon" | "biolink:OrganismTaxon" | 15 |
"biolink:NamedThing" | "biolink:Phenomenon" | 15 |
"biolink:InformationContentEntity" | "biolink:InformationContentEntity" | 13 |
"biolink:Disease" | "biolink:DiseaseOrPhenotypicFeature" | 13 |
"biolink:Phenomenon" | "biolink:InformationContentEntity" | 11 |
"biolink:Procedure" | "biolink:Event" | 11 |
"biolink:Agent" | "biolink:DiseaseOrPhenotypicFeature" | 10 |
"biolink:Procedure" | "biolink:Cell" | 9 |
"biolink:Device" | "biolink:DiseaseOrPhenotypicFeature" | 9 |
"biolink:ChemicalEntity" | "biolink:DiseaseOrPhenotypicFeature" | 8 |
"biolink:Procedure" | "biolink:NucleicAcidEntity" | 7 |
"biolink:InformationContentEntity" | "biolink:BiologicalEntity" | 7 |
"biolink:IndividualOrganism" | "biolink:Disease" | 6 |
"biolink:Gene" | "biolink:Disease" | 6 |
"biolink:Activity" | "biolink:Phenomenon" | 6 |
"biolink:Device" | "biolink:NamedThing" | 6 |
"biolink:Cohort" | "biolink:Procedure" | 6 |
"biolink:NamedThing" | "biolink:Procedure" | 6 |
"biolink:Disease" | "biolink:NamedThing" | 6 |
"biolink:NamedThing" | "biolink:GrossAnatomicalStructure" | 5 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:Behavior" | 5 |
"biolink:NucleicAcidEntity" | "biolink:Disease" | 5 |
"biolink:Activity" | "biolink:Procedure" | 5 |
"biolink:InformationContentEntity" | "biolink:Phenomenon" | 5 |
"biolink:PhysiologicalProcess" | "biolink:InformationContentEntity" | 5 |
"biolink:Publication" | "biolink:Cohort" | 5 |
"biolink:Phenomenon" | "biolink:BiologicalEntity" | 5 |
"biolink:Activity" | "biolink:Activity" | 5 |
"biolink:NamedThing" | "biolink:PopulationOfIndividualOrganisms" | 5 |
"biolink:PhenotypicFeature" | "biolink:InformationContentEntity" | 5 |
"biolink:Cohort" | "biolink:GrossAnatomicalStructure" | 5 |
"biolink:Activity" | "biolink:PhysiologicalProcess" | 4 |
"biolink:OrganismTaxon" | "biolink:Disease" | 4 |
"biolink:ChemicalEntity" | "biolink:OrganismTaxon" | 4 |
"biolink:PhysiologicalProcess" | "biolink:BiologicalEntity" | 4 |
"biolink:NamedThing" | "biolink:Activity" | 4 |
"biolink:Activity" | "biolink:Behavior" | 3 |
"biolink:NamedThing" | "biolink:Behavior" | 3 |
"biolink:Cohort" | "biolink:Phenomenon" | 3 |
"biolink:PhysiologicalProcess" | "biolink:PhysiologicalProcess" | 3 |
"biolink:InformationContentEntity" | "biolink:Behavior" | 3 |
"biolink:Polypeptide" | "biolink:Disease" | 3 |
"biolink:AnatomicalEntity" | "biolink:OrganismTaxon" | 3 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:OrganismTaxon" | 3 |
"biolink:AnatomicalEntity" | "biolink:Disease" | 3 |
"biolink:Cohort" | "biolink:IndividualOrganism" | 3 |
"biolink:Publication" | "biolink:Phenomenon" | 3 |
"biolink:Activity" | "biolink:PopulationOfIndividualOrganisms" | 3 |
"biolink:Publication" | "biolink:Activity" | 3 |
"biolink:Agent" | "biolink:NamedThing" | 3 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:Behavior" | 2 |
"biolink:InformationContentEntity" | "biolink:PhysiologicalProcess" | 2 |
"biolink:Device" | "biolink:PhenotypicFeature" | 2 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:PhenotypicFeature" | 2 |
"biolink:Publication" | "biolink:OrganismTaxon" | 2 |
"biolink:NamedThing" | "biolink:CellularComponent" | 2 |
"biolink:NamedThing" | "biolink:AnatomicalEntity" | 2 |
"biolink:NamedThing" | "biolink:Cohort" | 2 |
"biolink:Phenomenon" | "biolink:Behavior" | 2 |
"biolink:Publication" | "biolink:PhysiologicalProcess" | 2 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:InformationContentEntity" | 2 |
"biolink:Cohort" | "biolink:Activity" | 2 |
"biolink:Disease" | "biolink:Behavior" | 1 |
"biolink:Agent" | "biolink:Behavior" | 1 |
"biolink:Publication" | "biolink:Behavior" | 1 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:Phenomenon" | 1 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:PhysiologicalProcess" | 1 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:PhysiologicalProcess" | 1 |
"biolink:Disease" | "biolink:PhenotypicFeature" | 1 |
"biolink:AnatomicalEntity" | "biolink:DiseaseOrPhenotypicFeature" | 1 |
"biolink:Phenomenon" | "biolink:Phenomenon" | 1 |
"biolink:Device" | "biolink:ChemicalEntity" | 1 |
"biolink:InformationContentEntity" | "biolink:CellularComponent" | 1 |
"biolink:Activity" | "biolink:AnatomicalEntity" | 1 |
"biolink:Phenomenon" | "biolink:AnatomicalEntity" | 1 |
"biolink:Cohort" | "biolink:AnatomicalEntity" | 1 |
"biolink:InformationContentEntity" | "biolink:AnatomicalEntity" | 1 |
"biolink:Phenomenon" | "biolink:Cohort" | 1 |
"biolink:PhysiologicalProcess" | "biolink:Cohort" | 1 |
"biolink:Phenomenon" | "biolink:PhysiologicalProcess" | 1 |
"biolink:Device" | "biolink:PhysiologicalProcess" | 1 |
"biolink:PhysiologicalProcess" | "biolink:Phenomenon" | 1 |
"biolink:PhysiologicalProcess" | "biolink:Behavior" | 1 |
"biolink:NamedThing" | "biolink:NucleicAcidEntity" | 1 |
"biolink:Cohort" | "biolink:NucleicAcidEntity" | 1 |
"biolink:Publication" | "biolink:PopulationOfIndividualOrganisms" | 1 |
"biolink:Phenomenon" | "biolink:PopulationOfIndividualOrganisms" | 1 |
"biolink:Agent" | "biolink:InformationContentEntity" | 1 |
"biolink:PopulationOfIndividualOrganisms" | "biolink:GrossAnatomicalStructure" | 1 |
"biolink:Phenomenon" | "biolink:GrossAnatomicalStructure" | 1 |
"biolink:InformationContentEntity" | "biolink:Activity" | 1 |
"biolink:DiseaseOrPhenotypicFeature" | "biolink:BiologicalEntity" | 1 |
"biolink:Publication" | "biolink:InformationContentEntity" | 1 |
"biolink:ChemicalEntity" | "biolink:NamedThing" | 1 |
I have logged an issue in the Biolink GitHub project to request that the relation mapping be updated so that `SEMMEDDB:diagnoses` maps to `biolink:diagnoses`.
So this has been fixed in both Biolink and in RTX-KG2. Closing it out.
This issue came to light investigating RTX issue 1774, which was first reported by @dkoslicki.
On the KG2.7.4pre Neo4j database server (`kg2endpoint3.rtx.ai`), when I run this Cypher command, I see that most of the subject nodes in the matching triples are really procedures and not molecular biomarkers. So I think we need to rethink this particular predicate mapping.