Skip to content

Commit b4992a2

Browse files
committed
rare-source: add umls disease and output gene name support
1 parent 744c942 commit b4992a2

File tree

1 file changed

+76
-14
lines changed

1 file changed

+76
-14
lines changed

ncats_rare_source/smartapi.yaml

Lines changed: 76 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -309,8 +309,10 @@ paths:
309309
tags:
310310
- query
311311
x-bte-kgs-operations:
312-
- "$ref": "#/components/x-bte-kgs-operations/gene-disease"
313-
- "$ref": "#/components/x-bte-kgs-operations/disease-gene"
312+
- "$ref": "#/components/x-bte-kgs-operations/gene-diseaseOrphanet"
313+
- "$ref": "#/components/x-bte-kgs-operations/diseaseOrphanet-gene"
314+
# - "$ref": "#/components/x-bte-kgs-operations/gene-diseaseUMLS"
315+
# - "$ref": "#/components/x-bte-kgs-operations/diseaseUMLS-gene"
314316
components:
315317
parameters:
316318
callback:
@@ -571,21 +573,22 @@ components:
571573
# type: array
572574
# - type: string
573575
x-bte-kgs-operations:
574-
## look here for more details: https://raresource.nih.gov/genes/
575-
## gene ids: using entrezgene
576-
## all have entrezgene and symbol, most have hgnc (2864/2901) or ensemblgene (2863/2901)
577-
## disease ids: using orphanet
578-
## no support for gard in biolink-model or sri node normalizer right now
579-
## practically all have gard, most have orphanet (2846/2901) or omim (2774/2901) or umls (2529/2901)
580-
## some have mesh (1450/2901), very few have icd10cm (7/2901)
576+
## - look here for more details: https://raresource.nih.gov/genes/
577+
## - gene ids: using entrezgene
578+
## - all have entrezgene and symbol, most have hgnc (2864/2901) or ensemblgene (2863)
579+
## - disease ids: using orphanet and umls
580+
## - seems like all diseases have gard IDs, but there's no support in biolink-model or sri node normalizer right now
581+
## - most have orphanet (2846/2901) and the 55 that don't have orphanet seem to have umls (2529)
582+
## https://biothings.ncats.io/rare_source/query?q=NOT%20_exists_:raresource.disease.orphanet%20AND%20_exists_:raresource.disease.umls
583+
## - other ID namespaces are omim (2774), mesh (1450), very few have icd10cm (7)
581584
## available data:
582585
## - cooccurrence_url isn't indexed so I can't tell how many records have this info
583586
## format is https://raresource.nih.gov/literature/cooccurrence/WDPCP/0006866 (gene symbol, then disease gard id)
584587
## - annotation_url isn't indexed and links to resource's lit page for the gene
585588
## format is https://raresource.nih.gov/literature/gene/SDCCAG8 (gene symbol)
586589
## - raresource.disease.annotation_url isn't indexed and links to resource's lit page for the disease
587590
## format is https://raresource.nih.gov/literature/disease/0006866 (disease gard id)
588-
gene-disease:
591+
gene-diseaseOrphanet:
589592
- supportBatch: true
590593
useTemplating: true
591594
inputs:
@@ -607,11 +610,11 @@ components:
607610
predicate: gene_associated_with_condition
608611
source: "infores:rare-source"
609612
response_mapping:
610-
"$ref": "#/components/x-bte-response-mapping/disease-object"
613+
"$ref": "#/components/x-bte-response-mapping/diseaseOrphanet-object"
611614
# testExamples:
612615
# - qInput: "NCBIGene:100" ## ADA
613616
# oneOutput: "ORPHANET:39041" ## Omenn syndrome
614-
disease-gene:
617+
diseaseOrphanet-gene:
615618
- supportBatch: true
616619
useTemplating: true
617620
inputs:
@@ -627,7 +630,7 @@ components:
627630
parameters:
628631
## no prefix on output
629632
fields: >-
630-
entrezgene
633+
entrezgene,symbol
631634
size: 1000 ## size limit; adding just in case
632635
predicate: condition_associated_with_gene
633636
source: "infores:rare-source"
@@ -636,10 +639,69 @@ components:
636639
# testExamples:
637640
# - qInput: "ORPHANET:110" ## Bardet-Biedl syndrome
638641
# oneOutput: "NCBIGene:10806" ## SDCCAG8
642+
gene-diseaseUMLS:
643+
- supportBatch: true
644+
useTemplating: true
645+
inputs:
646+
- id: NCBIGene
647+
semantic: Gene
648+
requestBody:
649+
body:
650+
q: "{{ queryInputs }}" ## no prefix
651+
scopes: entrezgene
652+
outputs:
653+
- id: UMLS
654+
semantic: Disease
655+
parameters:
656+
## umls ID has no prefix
657+
fields: >-
658+
raresource.disease.umls,
659+
raresource.disease.cooccurrence_url
660+
size: 1000 ## note size limit
661+
predicate: gene_associated_with_condition
662+
source: "infores:rare-source"
663+
response_mapping:
664+
"$ref": "#/components/x-bte-response-mapping/diseaseUMLS-object"
665+
# testExamples:
666+
# - qInput: "NCBIGene:10075" ## HUWE1
667+
# oneOutput: "UMLS:C0796003" ## Intellectual developmental disorder, x-linked, syndromic, turner type
668+
diseaseUMLS-gene:
669+
- supportBatch: true
670+
useTemplating: true
671+
inputs:
672+
- id: UMLS
673+
semantic: Disease
674+
requestBody:
675+
body:
676+
q: "{{ queryInputs }}" ## no prefix
677+
scopes: raresource.disease.umls
678+
outputs:
679+
- id: NCBIGene
680+
semantic: Gene
681+
parameters:
682+
## no prefix on output
683+
fields: >-
684+
entrezgene,symbol
685+
size: 1000 ## size limit; adding just in case
686+
predicate: condition_associated_with_gene
687+
source: "infores:rare-source"
688+
response_mapping:
689+
"$ref": "#/components/x-bte-response-mapping/gene-object"
690+
# testExamples:
691+
# - qInput: "UMLS:C3887743" ## Wilms tumor 2
692+
# oneOutput: "NCBIGene:105259599" ## H19-ICR (will use output_name)
693+
## testing with "UMLS:C2675767" (Epiphyseal dysplasia, multiple, 6) ->
694+
## "NCBIGene:1297" (COL9A1) will use SRI-Node-Norm-retrieved name
639695
x-bte-response-mapping:
640-
disease-object:
696+
## didn't add names for gene -> disease. when I tried, the co-occurrence urls would appear on every Edge,
697+
## when they're supposed to show up only on the edge they correspond to
698+
diseaseOrphanet-object:
641699
ORPHANET: raresource.disease.orphanet ## no prefix
642700
"biolink:xref": raresource.disease.cooccurrence_url
643701
## this url leads to a webpage with literature supporting the gene-disease relationship
702+
diseaseUMLS-object:
703+
UMLS: raresource.disease.umls ## no prefix
704+
"biolink:xref": raresource.disease.cooccurrence_url
644705
gene-object:
645706
NCBIGene: entrezgene ## no prefix
707+
output_name: symbol ## SRI Node Norm sometimes doesn't know the NCBIGene name. Using "gene" symbol as name

0 commit comments

Comments
 (0)