@@ -309,8 +309,10 @@ paths:
309
309
tags :
310
310
- query
311
311
x-bte-kgs-operations :
312
- - " $ref " : " #/components/x-bte-kgs-operations/gene-disease"
313
- - " $ref " : " #/components/x-bte-kgs-operations/disease-gene"
312
+ - " $ref " : " #/components/x-bte-kgs-operations/gene-diseaseOrphanet"
313
+ - " $ref " : " #/components/x-bte-kgs-operations/diseaseOrphanet-gene"
314
+ # - "$ref": "#/components/x-bte-kgs-operations/gene-diseaseUMLS"
315
+ # - "$ref": "#/components/x-bte-kgs-operations/diseaseUMLS-gene"
314
316
components :
315
317
parameters :
316
318
callback :
@@ -571,21 +573,22 @@ components:
571
573
# type: array
572
574
# - type: string
573
575
x-bte-kgs-operations :
574
- # # look here for more details: https://raresource.nih.gov/genes/
575
- # # gene ids: using entrezgene
576
- # # all have entrezgene and symbol, most have hgnc (2864/2901) or ensemblgene (2863/2901)
577
- # # disease ids: using orphanet
578
- # # no support for gard in biolink-model or sri node normalizer right now
579
- # # practically all have gard, most have orphanet (2846/2901) or omim (2774/2901) or umls (2529/2901)
580
- # # some have mesh (1450/2901), very few have icd10cm (7/2901)
576
+ # # - look here for more details: https://raresource.nih.gov/genes/
577
+ # # - gene ids: using entrezgene
578
+ # # - all have entrezgene and symbol, most have hgnc (2864/2901) or ensemblgene (2863)
579
+ # # - disease ids: using orphanet and umls
580
+ # # - seems like all diseases have gard IDs, but there's no support in biolink-model or sri node normalizer right now
581
+ # # - most have orphanet (2846/2901) and the 55 that don't have orphanet seem to have umls (2529)
582
+ # # https://biothings.ncats.io/rare_source/query?q=NOT%20_exists_:raresource.disease.orphanet%20AND%20_exists_:raresource.disease.umls
583
+ # # - other ID namespaces are omim (2774), mesh (1450), very few have icd10cm (7)
581
584
# # available data:
582
585
# # - cooccurrence_url isn't indexed so I can't tell how many records have this info
583
586
# # format is https://raresource.nih.gov/literature/cooccurrence/WDPCP/0006866 (gene symbol, then disease gard id)
584
587
# # - annotation_url isn't indexed and links to resource's lit page for the gene
585
588
# # format is https://raresource.nih.gov/literature/gene/SDCCAG8 (gene symbol)
586
589
# # - raresource.disease.annotation_url isn't indexed and links to resource's lit page for the disease
587
590
# # format is https://raresource.nih.gov/literature/disease/0006866 (disease gard id)
588
- gene-disease :
591
+ gene-diseaseOrphanet :
589
592
- supportBatch : true
590
593
useTemplating : true
591
594
inputs :
@@ -607,11 +610,11 @@ components:
607
610
predicate : gene_associated_with_condition
608
611
source : " infores:rare-source"
609
612
response_mapping :
610
- " $ref " : " #/components/x-bte-response-mapping/disease -object"
613
+ " $ref " : " #/components/x-bte-response-mapping/diseaseOrphanet -object"
611
614
# testExamples:
612
615
# - qInput: "NCBIGene:100" ## ADA
613
616
# oneOutput: "ORPHANET:39041" ## Omenn syndrome
614
- disease -gene :
617
+ diseaseOrphanet -gene :
615
618
- supportBatch : true
616
619
useTemplating : true
617
620
inputs :
@@ -627,7 +630,7 @@ components:
627
630
parameters :
628
631
# # no prefix on output
629
632
fields : >-
630
- entrezgene
633
+ entrezgene,symbol
631
634
size : 1000 # # size limit; adding just in case
632
635
predicate : condition_associated_with_gene
633
636
source : " infores:rare-source"
@@ -636,10 +639,69 @@ components:
636
639
# testExamples:
637
640
# - qInput: "ORPHANET:110" ## Bardet-Biedl syndrome
638
641
# oneOutput: "NCBIGene:10806" ## SDCCAG8
642
+ gene-diseaseUMLS :
643
+ - supportBatch : true
644
+ useTemplating : true
645
+ inputs :
646
+ - id : NCBIGene
647
+ semantic : Gene
648
+ requestBody :
649
+ body :
650
+ q : " {{ queryInputs }}" # # no prefix
651
+ scopes : entrezgene
652
+ outputs :
653
+ - id : UMLS
654
+ semantic : Disease
655
+ parameters :
656
+ # # umls ID has no prefix
657
+ fields : >-
658
+ raresource.disease.umls,
659
+ raresource.disease.cooccurrence_url
660
+ size : 1000 # # note size limit
661
+ predicate : gene_associated_with_condition
662
+ source : " infores:rare-source"
663
+ response_mapping :
664
+ " $ref " : " #/components/x-bte-response-mapping/diseaseUMLS-object"
665
+ # testExamples:
666
+ # - qInput: "NCBIGene:10075" ## HUWE1
667
+ # oneOutput: "UMLS:C0796003" ## Intellectual developmental disorder, x-linked, syndromic, turner type
668
+ diseaseUMLS-gene :
669
+ - supportBatch : true
670
+ useTemplating : true
671
+ inputs :
672
+ - id : UMLS
673
+ semantic : Disease
674
+ requestBody :
675
+ body :
676
+ q : " {{ queryInputs }}" # # no prefix
677
+ scopes : raresource.disease.umls
678
+ outputs :
679
+ - id : NCBIGene
680
+ semantic : Gene
681
+ parameters :
682
+ # # no prefix on output
683
+ fields : >-
684
+ entrezgene,symbol
685
+ size : 1000 # # size limit; adding just in case
686
+ predicate : condition_associated_with_gene
687
+ source : " infores:rare-source"
688
+ response_mapping :
689
+ " $ref " : " #/components/x-bte-response-mapping/gene-object"
690
+ # testExamples:
691
+ # - qInput: "UMLS:C3887743" ## Wilms tumor 2
692
+ # oneOutput: "NCBIGene:105259599" ## H19-ICR (will use output_name)
693
+ # # testing with "UMLS:C2675767" (Epiphyseal dysplasia, multiple, 6) ->
694
+ # # "NCBIGene:1297" (COL9A1) will use SRI-Node-Norm-retrieved name
639
695
x-bte-response-mapping :
640
- disease-object :
696
+ # # didn't add names for gene -> disease. when I tried, the co-occurrence urls would appear on every Edge,
697
+ # # when they're supposed to show up only on the edge they correspond to
698
+ diseaseOrphanet-object :
641
699
ORPHANET : raresource.disease.orphanet # # no prefix
642
700
" biolink:xref " : raresource.disease.cooccurrence_url
643
701
# # this url leads to a webpage with literature supporting the gene-disease relationship
702
+ diseaseUMLS-object :
703
+ UMLS : raresource.disease.umls # # no prefix
704
+ " biolink:xref " : raresource.disease.cooccurrence_url
644
705
gene-object :
645
706
NCBIGene : entrezgene # # no prefix
707
+ output_name : symbol # # SRI Node Norm sometimes doesn't know the NCBIGene name. Using "gene" symbol as name
0 commit comments