forked from datacommonsorg/schema
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgenome_annotation.mcf
1832 lines (1589 loc) · 91.1 KB
/
genome_annotation.mcf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
# Classes
Node: dcid:Allele
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
name: "Allele"
Node: dcid:BasePairs
typeOf: dcs:UnitOfMeasure
name: "BasePairs"
subClassOf: dcs:GenomeAnnotation
description: "The number of pairs of complementary bases in a double-stranded nucleic acid molecule (DNA), consisting of a purine in one strand linked by hydrogen bonds to a pyrimidine in the other."
Node: dcid:Chromosome
name: "Chromosome"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "A threadlike structure of nucleic acids and protein found in the nucleus of most living cells, carrying genetic information in the form of genes."
Node: dcid:Gene
name: "Gene"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "Gene symbol of a gene, which is the basic hereditary unit of life."
descriptionUrl: "https://bioportal.bioontology.org/ontologies/OGG"
Node: dcid:GeneGeneAssociation
name: "GeneGeneAssociation"
typeOf: schema:Class
subClassOf: dcs:GeneticAssociation
description: "The association between two genes."
Node: dcid:GeneGeneticVariantAssociation
name: "GeneGeneticVariantAssociation"
typeOf: schema:Class
subClassOf: dcs:GeneticAssoication
description: "The association between a gene and a genetic variant. This association is typically tissue-specific."
Node: dcid:GeneticAssociation
name: "GeneticAssociation"
typeOf: schema:Class
subClassOf: dcs:Association,dcs:GenomeAnnotation
description: "Association between a genome annotation and another entity type."
Node: dcid:GeneticVariant
name: "GeneticVariant"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "A single-nucleotide polymorphism, which is a substitution of a single nucleotide that occurs at a specific position in the genome, where each variation is present to some appreciable degree within a population. These are defined by dbSNP and includes small indels as well."
descriptionUrl: "http://rohsdb.usc.edu/GBshape/cgi-bin/hgTables?db=hg19&hgta_group=varRep&hgta_track=snp137&hgta_table=snp137&hgta_doSchema=describe+table+schema"
Node: dcid:GeneticVariantGeneticVariantAssociation
name: "GeneticVariantGeneticVariantAssociation"
typeOf: schema:Class
subClassOf: dcs:GeneticAssociation
description: "The association between two genetic variants."
Node: dcid:GenomeAnnotation
name: "GenomeAnnotation"
typeOf: schema:Class
subClassOf: dcs:BiologicalEntity
description: "Entities or properties of the genome."
Node: dcid:GenomeAssembly
name: "GenomeAssembly"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "The reference genome to which the associated nucleotides have been aligned."
Node: dcid:GenomeAssemblyUnit
name: "GenomeAssemblyUnit"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "The unit of assembling a reference genome to which the associated nucleotides have been aligned. Each unit is typically defined by the location of the cell from which the DNA is located such as the nucleus or an organelle."
Node: dcid:GeneMendelianInheritanceInManIdentifierAssociation
name: "GeneMendelianInheritanceInManIdentifierAssociation"
typeOf: schema:Class
subClassOf: dcs:GeneticAssociation
description: "Report of the relationship between MIM numbers (OMIM), GeneIDs, and Records in MedGen."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/gene/README"
Node: dcid:GeneOntologyTerm
name: "GeneOntologyTerm"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
abbreviation: "GO Term"
description: "A Gene Ontology (GO) term is a controlled vocabulary term used to describe the functions of genes and gene products (proteins and RNA) in a standardized way. It provides a structured representation of biological knowledge, enabling researchers to annotate genes and gene products, compare and integrate data, and explore networks and pathways. It has a heirarchical structure and consists of three seperate ontologies: Biological Process (BP), Molecular Function (MF), and Cellular Component (CC)."
Node: dcid:GeneReferenceIntoFunction
name: "GeneReferenceIntoFunction"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "A GeneRIF (Gene Reference Into Function) is a concise phrase describing the function of a gene. It provides a quick summary of the gene's role, linking the gene to its known or predicted biological function. GeneRIFs are manually curated from published literature and stored in the NCBI Gene database."
Node: dcid:GenomicCoordinates
name: "GenomicCoordinates"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "The location in the genome or DNA conting of an element of interest. This is reported in the standardized format of [chrom, chromStart, chromEnd]. These coordinates are specific to any given genome assembly."
Node: dcid:GenomicPosition
name: "GenomicPosition"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "The precise nucleotide location in thegenome or DNA contigof an element of interest. This is reported in the standardized format of [chrom position]. This position is specific to any given genome assembly. Genomic position is typically used to refer to genetic variants"
Node: dcid:GenomicRegion
name: "GenomicRegion"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "A genomic region refers to a contiguous stretch of DNA within an organism's genome. It can encompass a single gene, a group of genes, regulatory elements, or any other segment of DNA with a defined start and end point."
Node: dcid:NonCodingRNA
name: "NonCodingRNA"
typeOf: schema:Class
subClassOf: dcs:Gene
description: "A non-coding RNA (ncRNA) is a functional RNA molecule that is not translated into a protein. The DNA sequence from which a functional non-coding RNA is transcribed is often called an RNA gene. Abundant and functionally important types of non-coding RNAs include transfer RNAs (tRNAs) and ribosomal RNAs (rRNAs), as well as small RNAs such as microRNAs, siRNAs, piRNAs, snoRNAs, snRNAs, exRNAs, scaRNAs and the long ncRNAs such as Xist and HOTAIR."
descriptionUrl: "https://en.wikipedia.org/wiki/Non-coding_RNA"
Node: dcid:Nucleotide
name: "Nucleotide"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "A recorded nucleotide on the positive strand of a denoted genome assembly."
Node: dcid:MaturePeptide
name: "MaturePeptide"
typeOf: schema:Class
subClassOf: dcs:Protein
description: "A mature peptides represents the final, functional form of a protein after it has undergone post-translational modifications and processing. These modifications can include: cleavage, chemical modifications, and formation of disulfide bonds. It represents the active form of the protein that carries out its biological role. Mature peptides play crucial roles in various cellular processes, including signaling, enzymatic activity, structural support, and immune response."
Node: dcid:MendelianInheritanceInManEntity
name: "MendelianInheritanceInManEntity"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "An entity representing a human gene or genetic phenotype in Online Mendelian Inheritance in Man (OMIM)."
url: "https://www.omim.org/"
Node: dcid:RnaTranscript
name: "RnaTranscript"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "Recorded transcript. Unique identifier (GENCODE transcript ID for GENCODE Basic)."
Node: dcid:SequenceOntologyTerm
name: "SequenceOntologyTerm"
typeOf: schema:Class
subClassOf: dcs:GenomeAnnotation
description: "The Sequence Ontology (SO) is a set of terms and relationships used to describe the features and attributes of biological sequence. SO includes different kinds of features which can be located on the sequence. Biological features are those which are defined by their disposition to be involved in a biological process. Examples are binding_site and exon. Biomaterial features are those which are intended for use in an experiment such as aptamer and PCR_product. There are also experimental features which are the result of an experiment. SO also provides a rich set of attributes to describe these features such as polycistronic and maternally_imprinted."
descriptionUrl: "http://www.sequenceontology.org/"
Node: dcid:SequenceOntologyTermSynonym
name: "SequenceOntologyTermSynonym"
typeOf: schema:Class
subClassOf: dcs:SequenceOntologyTerm
description: "These are the synonyms for a SequenceOntologyTerm node. This includes information about the closeness of the match with the SequenceOntologyTerm, the source of the information, and a string value of the synonym itself."
Node: dcid:UmlsConceptUniqueIdentifier
name: "UmlsConceptUniqueIdentifier"
typeOf: schema:Class
subClassOf: dcs:BiomedicalEntity
synonym: "MedGen Concept ID", "CUI"
description: "A Concept Unique Identifer (CUI) for a entity in MedGen, which is NCBI's portal to information about conditions and phenotypes related to Medical Genetics. Terms from the NIH Genetic Testing Registry (GTR), UMLS, HPO, Orphanet, ClinVar and other sources are aggregated into concepts, each of which is assigned a unique identifier and a preferred name and symbol. The core content of the record may include names, identifiers used by other databases, mode of inheritance, clinical features, and map location of the loci affecting the disorder. The concept identifier (CUI) is used to aggregate information about that concept, similar to the way NCBI Gene serves as a gateway to gene-related information."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/medgen/docs/help/"
# Properties
Node: dcid:agiLocusCode
name: "agiLocusCode"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
synonym: "Arabidopsis Genome Initiative"
description: "The Arabidopsis Information Resource (TAIR) is a continuously updated, online database of genetic and molecular biology data for the model plant Arabidopsis thaliana that provides a global research community with centralized access to data for over 30,000 Arabidopsis genes. Each locus in Arabidopsis is assigned a unique identifier, termed the AGI locus code (AGI, Arabidopsis Genome Initiative) which consists of the prefix At, followed by the chromosome identifier (1-5 or M or C) followed by g for gene and then a unique 5 digit number (e.g. At2g46340). These AGI locus codes are used by other Arabidopsis resources in addition to TAIR, such as Araport."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4545719/)."
url: "https://www.arabidopsis.org/"
Node: dcid:alleleOrigin
name: "alleleOrigin"
typeOf: schema:Property
rangeIncludes: dcs:VariantAlleleOriginEnum
domainIncludes: dcs:GeneticVariant
description: "Variant Allele Origin: unspecified, germline, somatic, both, inherited, paternal, maternal, uni-parental, bi-parental, not_tested, tested_inconclusive, de-novo, or other."
Node: dcid:alleleType
name: "alleleType"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "The allele of a genetic variant observed within a population."
Node: dcid:allianceOfGenomeResourcesId
name: "allianceOfGenomeResourcesId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
description: "The gene identifier used by the Alliance of Genome Resources, which is a consortium of seven model organism databases (MODs) and the Gene Ontology (GO) Consortium whose goal is to provide an integrated view of their data to all biologists, clinicians and other interested parties.The primary mission of the Alliance of Genome Resources (the Alliance) is to develop and maintain sustainable genome information resources that facilitate the use of diverse model organisms in understanding the genetic and genomic basis of human biology, health and disease. The seven model organism databases managed by the consortium is as follows: FlyBase, Mouse Genome Database (MGD), Rat Genome Database (RGD), Saccharomyces Genome Database (SGD), WormBase, XenBase, Zebrafish Information Network (ZFIN), and the Genome Ontology Consortium (GOC)."
url: "https://www.alliancegenome.org/"
Node: dcid:animalQuantitativeTraitLociId
name: "animalQuantitativeTraitLociId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
abbreviation: "animal QTL Id"
description: "The gene identifier used by The Animal Quantitative Trait Loci (QTL) Database (Animal QTLdb), a database that strives to collect all publicly available trait mapping data, i.e. QTL (phenotype/expression, eQTL), candidate gene and association data (GWAS), and copy number variations (CNV) mapped to livestock animal genomes, in order to facilitate locating and comparing discoveries within and between species. It supports information on cattle, chickens, horses, goats, pigs, rainbow trout, and sheep."
descriptionUrl: "https://www.animalgenome.org/cgi-bin/QTLdb/index"
Node: dcid:alternateGeneSymbol
name: "alternateGeneSymbol"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:Gene
description: "Alternative or secondary symbol for a gene."
Node: dcid:aphidBaseId
name: "aphidBaseId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
description: "The gene identifier used by AphidBase, which is a reference information system providing genomic resources for the study of aphids. It hosts several reference aphid genomes, including the first aphid genome that was sequenced: Acyrthosiphon pisum."
descriptionUrl: "https://bipaa.genouest.org/is/aphidbase/"
Node: dcid:asapId
name: "asapId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
synonym: "A Systematic Annotation Package for Community Analysis of Genomes ID"
description: "The gene identifier used by ASAP (a systematic annotation package for community analysis of genomes), which is is a relational database and web interface developed to store, update and distribute genome sequence data and gene expression data collected by or in collaboration with researchers at the University of Wisconsin - Madison."
descriptionUrl: "http://asap.ahabs.wisc.edu/asap/ASAP1.htm"
url: "https://asap.ahabs.wisc.edu/"
Node: dcid:assemblyMethod
dcid: "assemblyMethod"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GenomeAssembly
description: "The alogrithm used to assemble the genome from sequencing reads."
Node: dcid:associationSource
name: "associationSource"
typeOf: schema:Property
domainIncludes: schema:Thing
rangeIncludes: schema:Text
description: "The organization that reported an association between two things."
Node: dcid:associationType
name: "associationType"
typeOf: schema:Property
domainIncludes: schema:Thing
rangeIncludes: dcs:AssociationTypeEnum
description: "The way by which an association between two entities is made."
Node: dcid:averageHeterozygosity
name: "averageHeterozygosity"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Average heterozygosity from all observations. Note: may be computed on small number of samples."
Node: dcid:averageHeterozygositySE
name: "averageHeterozygositySE"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Standard Error for the average heterozygosity."
Node: dcid:beetleBaseId
name: "beetleBaseId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
description: "The gene identifiers formatted as 'TC######' used by BeetleBase, which contains comprehensive genomic information for the red flour beetle Tribolium castaneum."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2808946/"
Node: dcid:betaDistributionShapes
name: "betaDistributionShapes"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneGeneticVariantAssociation
description: "The shape parameters of the fitted Beta distribution: B(shape1, shape2)."
Node: dcid:bovineGenomeDatabaseId
name: "bovineGenomeDatabaseId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
abbreviation: "BGD ID"
description: "The gene identifier used by the Bovine Genome Database (BGD), which supports the efforts of bovine genomics researchers by providing data mining, genome navigation and annotation tools for the bovine reference genome based on the hereford cow, L1 Dominette 01449."
descriptionUrl: "https://bovinegenome.elsiklab.missouri.edu/"
Node: dcid:chickenGeneNomenclatureConsortiumId
name: "chickenGeneNomenclatureConsortiumId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
abbreviation: "CGNC ID"
description: "The gene identifier used by the Chicken Gene Nomenclature Consortium (CGNC), which is an international group of researchers interested in providing standardized gene nomenclature for chicken genes."
descriptionUrl: "http://birdgenenames.org/cgnc/about.jsp"
Node: dcid:chrom
name: "chrom"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: schema:Text,dcs:Chromosome
description: "Chromosome (e.g. chr3, chrY, chr2_random) or scaffold (e.g. scaffold10671) name."
descriptionUrl: "https://en.wikipedia.org/wiki/BED_(file_format)"
Node: dcid:chromosomeSize
name: "chromosomeSize"
typeOf: schema:Property
rangeIncludes: schema:Quantity
domainIncludes: dcs:Chromosome
description: "The number of nucleotides in a given chromosome."
Node: dcid:chromStart
name: "chromStart"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: schema:Number
description: "Start coordinate on the chromosome or scaffold for the sequence considered (the first base on the chromosome is numbered 0)."
descriptionUrl: "https://en.wikipedia.org/wiki/BED_(file_format)"
Node: dcid:chromEnd
name: "chromEnd"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: schema:Number
description: "End coordinate on the chromosome or scaffold for the sequence considered. This position is non-inclusive, unlike chromStart."
descriptionUrl: "https://en.wikipedia.org/wiki/BED_(file_format)"
Node: dcid:clinicalSignificance
name: "clinicalSignificance"
typeOf: schema:Property
rangeIncludes: dcs:ClinSigEnum
domainIncludes: dcs:GeneticVariant
description: "Clinical significance for this single variant: other, affects, uncertain_significance, pathogenic, risk_factor, benign, conflicting_interpretations_of_pathogenicity, association, likely_pathogenic, protective, likely_benign, not_provided, association_not_found, drug_response, pathogenic/likely_pathogenic,benign/likely_benign, unknown, untested, or histocompatibility."
Node: dcid:clinicalSource
name: "clinicalSource"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "The variant's clinical sources reported as tag-value pairs of database and variant identifier."
Node: dcid:clinVarAlleleID
name: "clinVarAlleleID"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "ClinVar Allele ID."
Node: dcid:clinicalSignificanceType
name: "clinicalSignificanceType"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "A type of clinical significance report observed for a genetic variant."
Node: dcid:clinVarFilterStatus
name: "clinVarFilterStatus"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "Filter status: PASS if this position has passed all filters, i.e., a call is made at this position. Otherwise, if the filters that the site failed are recorded."
Node: dcid:clinVarQualityScore
name: "clinVarQualityScore"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Phred-scaled quality score for the assertion made in ALT. i.e. -10log10 prob(call in ALT is wrong)."
Node: dcid:clinVarReviewStatus
name: "clinVarReviewStatus"
typeOf: schema:Property
rangeIncludes: dcs:ClinVarReviewStatusEnum
domainIncludes: dcs:GeneticVariant
description: "ClinVar review status: no assertion criteria provided, reviewed by expert panel, conflicting interpretations, criteria provided, non interpretation for the single variant, practice guideline, no conflicts, multiple submitters, or single_submitter."
Node: codingCoordinates
dcid:codingCoordinates
name: "codingCoordinates"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:RnaTranscript
description: "Specifies the genomic position of the genomic coordinates of the coding region associated with a given RefSeq Accession number."
Node: dcid:confidence
name: "confidence"
typeOf: schema:Property
domainIncludes: schema:Thing
rangeIncludes: schema:Text
description: "The level of confidence that a given result is accurate."
Node: dcid:contigCount
name: "contigCount"
typeOf: schema:Property
domainIncludes: dcs:GenomeAssembly
rangeIncludes: schema:Text
description: "The number of contigs in the primary assembly."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/genomes/README_assembly_summary.txt"
Node: dcid:cytogeneticMapLocation
name: "cytogeneticMapLocation"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:Gene
description: "The location of the gene on the chromosome. Each chromosome has a distinct banding pattern, and each band is numbered to help identify a particular region of a chromosome. This method of mapping a gene to a particular band of the chromosome is called cytogenetic mapping. For example, the hemoglobin beta gene (HBB) is found on chromosome 11p15.4. This means that the HBB gene lies on the short arm (p) of chromosome 11 and is found at the band labeled 15.4."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/books/NBK22266/"
Node: dcid:dbSNPBuildID
name: "dbSNPBuildID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "First dbSNP Build for RS."
Node: dcid:dbVarID
name: "dbVarID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "Accessions from dbVar for the genetic variant"
descriptionUrl: "https://www.ncbi.nlm.nih.gov/dbvar/"
Node: dcid:dictyBaseGeneId
name: "dictyBaseGeneId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
description: "The gene identifier used by dictyBase, an online bioinformatics database dedicated to the model organism Dictyostelium discoideum."
url: "http://dictybase.org/"
Node: dcid:digitalObjectIdentifier
name: "digitalObjectIdentifier"
typeOf: schema:Property
domainIncludes: dcs:Thing
rangeIncludes: schema:Text
abbreviation: "DOI"
description: "A DOI name is a digital identifier of an object, any object - physical, digital, or abstract. DOIs solve a common problem: keeping track of things. Things can be matter, material, content, or activities. Designed to be used by humans as well as machines, DOIs identify objects persistently. They allow things to be uniquely identified and accessed reliably. You know what you have, where it is, and others can track it too."
descriptionUrl: "https://www.doi.org/"
Node: dcid:diseaseDescription
name: "diseaseDescription"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "ClinVar's preferred disease name for the concept specified by disease identifiers."
Node: dcid:diseaseName
name: "diseaseName"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "ClinVar's preferred disease name for the concept specified by disease identifiers."
Node: dcid:dnaSequenceRole
name: "dnaSequenceRole"
typeOf: schema:Property
rangeIncludes: dcs:DNASequenceRoleEnum
domainIncludes: dcs:Chromosome
description: "The role a defined sequence of DNA has in a genome assembly."
Node: dcid:ecoCycAccessionId
name: "ecoCycAccessionId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
description: "The gene identifier used by BioCyc, which is a collection of 20,050 Pathway/Genome Databases (PGDBs) for model eukaryotes and for thousands of microbes, plus software tools for exploring them. BioCyc is an encyclopedic reference that contains curated data from 146,000 publications."
descriptionUrl: "https://biocyc.org/"
Node: dcid:echinoBaseGeneId
name: "echinoBaseGeneId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
description: "The gene identifier used by Echinobase, which supports the international research community by providing a centralized, integrated and easy to use web based resource to access the diverse and rich, functional genomics data of echinoderm species."
descriptionUrl: "https://www.echinobase.org/echinobase/"
Node: dcid:encodesGene
name: "encodesGene"
typeOf: schema:Property
domainIncludes: dcs:GenomicRegion
rangeIncludes: dcs:Gene
description: "Indicates the gene that the specific genomic region of DNA encodes."
Node: dcid:ensemblID
name: "ensemblID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:Gene,dcs:GeneGeneticVariantAssociation,dcs:Protein
description: "Ensembl ID, which describes a particular gene or protein."
Node: dcid:ensemblGeneId
name: "ensemblGeneId"
typeOf: schema:Property
domainIncludes: dcs:Gene, dcs:RnaTranscript, dcs:Protein
rangeIncludes: schema:Text
specializationOf: dcs:ensemblID
description: "Gene identifier used by Ensembl, which represents a specific genomic locus that is predicted to encode a protein or a functional RNA molecule. They are formatted starting with the prefix 'ENSG' followed by a unique number (e.g. ENSG00000139618 (Human BRCA2 gene)). This locus represents all known transcripts and protein products that originate from this locus, even if they have different splicing patterns or protein isoforms."
Node: dcid:ensemblProteinId
name: "ensemblProteinId"
typeOf: schema:Property
domainIncludes: dcs:Gene, dcs:RnaTranscript, dcs:Protein
rangeIncludes: schema:Text
specializationOf: dcs:ensemblID
description: "Protein identifier used by Ensembl, which represents a specific protein sequence translated from an mRNA transcript. They are formatted starting with the prefix 'ENSP' followed by a unique number (e.g. ENSP00000369406 (One of the protein isoforms encoded by the Human BRCA2 gene)). This represents the amino acid sequence that results from the specific combination of exons in the corresponding mRNA."
Node: dcid:ensemblRapidReleaseId
name: "ensemblRapidReleaseId"
typeOf: schema:Property
domainIncludes: dcs:Gene, dcs:RnaTranscript, dcs:Protein
rangeIncludes: schema:Text
specializationOf: dcs:ensemblID
Node: dcid:ensemblRapidReleaseId
name: "ensemblRapidReleaseId"
typeOf: schema:Property
domainIncludes: dcs:Gene, dcs:RnaTranscript, dcs:Protein
rangeIncludes: schema:Text
specializationOf: dcs:ensemblID
description: "Ensembl Rapid Release IDs are unique identifiers assigned to genomic features (primarily genes, but also transcripts and proteins) in newly sequenced genomes that are made available quickly through Ensembl's Rapid Release pipeline. This program has a release cycle of two weeks and the identifiers provide early access to gene annotation for genomes that are not yet fully integrated into the main Ensembl database."
Node: dcid:ensemblRnaId
name: "ensemblRnaId"
typeOf: schema:Property
domainIncludes: dcs:Gene, dcs:RnaTranscript, dcs:Protein
rangeIncludes: schema:Text
specializationOf: dcs:ensemblID
description: "RNA sequence identifier used by Ensembl, which represents a specific RNA transcript produced from a gene. This could be a messenger RNA (mRNA) that encodes a protein or other types of RNA such as long non-coding RNAs (lncRNAs) or microRNAs (miRNAs). They are formatted starting with the prefix 'ENST' followed by a unique number (e.g. ENST00000380152 (One of the many transcripts of the Human BRCA2 gene). This represents the specific combination of exons included in the mature transcript due to alternative splicing."
Node: dcid:experimentalFactorOntologyID
name: "experimentalFactorOntologyID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "The Experimental Factor Ontology (EFO) provides a systematic description of many experimental variables available in EBI databases, and for external projects such as the NHGRI GWAS catalog."
descriptionUrl: "https://www.ebi.ac.uk/efo/"
abbreviation: "EFO ID"
Node: dcid:flyBaseId
name: "flyBaseId"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Text
specializationOf: dcs:allianceOfGenomeResourcesId
description: "The gene identifier used by FlyBase. The aim of the FlyBase project is to provide an openly accessible centralized resource for Drosophila genetic, genomic and functional data. FlyBase is a member of the Alliance of Genome Resources."
descriptionUrl:"https://wiki.flybase.org/wiki/FlyBase:About#FlyBase_Mission_Statement"
url:"https://flybase.org/"
Node: dcid:frequency
typeOf: schema:Property
domainIncludes: dcid:Allele
rangeIncludes: schema:Number
name: "frequency"
Node: dcid:fullName
name: "fullName"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:Gene
description: "The full name of the gene."
Node: dcid:gcContent
name: "gcContent"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: schema:Quantity
description: "Percent of nitrogenous bases (guanine or cytosine) in DNA submitted for the assembly, rounded to the nearest 0.5%."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/genomes/README_assembly_summary.txt"
Node: dcid:genBankAssemblyAccession
name: "genBankAssemblyAccession"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:BiologicalEntity
description: "The accession version of the GenBank assembly or sequence element."
Node: dcid:genBankNucleotideAccession
name: "genBankNucleotideAccession"
typeOf: schema:Property
domainIncludes dcs:GenomeAssembly
rangeIncludes: schema:Text
description: "WGS-master: the GenBank Nucleotide accession and version for the master record of the Whole Genome Shotgun (WGS) project for the genome assembly. The master record can be retrieved from the NCBI Nucleotide resource: https://www.ncbi.nlm.nih.gov/nuccore. Genome assemblies that are complete genomes, and those that are clone-based, do not have WGS-master records. GenBank uses a different format for accessions of sequences that are a part of the WGS project."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/genomes/README_assembly_summary.txt"
Node: dcid:geneCount
name: "geneCount"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: schema:Number
description: "The total number of genes (both protein coding and non-coding genes) within a consensus region of DNA."
Node: dcid:geneGeneOntologyTermRelationshipQualifier
name: "geneGeneOntologyTermRelationshipQualifier"
typeOf: schema:Property
domainIncludes: dcs:GeneOntologyTerm
rangeIncludes: dcs:GOTermQualifierEnum
description: "The nature of the association between the gene product and the GO term."
Node: dcid:geneID
name: "geneID"
typeOf: schema:Property
rangeIncludes: dcs:Gene
domainIncludes: dcs:GeneticAssociation,dcs:GeneticVariant,dcs:Protein
description: "Link out to the Gene node associated with the current node."
Node: dcid:geneOmimRelationshipComment
name: "geneOmimRelationshipComment"
typeOf: schema:Property
domainIncludes: dcs:GeneMendelianInheritanceInManIdentifierAssociation
rangeIncludes: dcs:GeneOmimRelationshipCommentEnum
description: "The qualifiers OMIM provides when reporting a gene/phenotype relationship."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/gene/README"
Node: dcid:geneOmimRelationshipSource
name: "geneOmimRelationshipSource"
typeOf: schema:Property
domainIncludes: dcs:GeneMendelianInheritanceInManIdentifierAssociation
rangeIncludes: dcs:GeneOmimRelationshipSourceEnum
description: "The source of a report of a relationship between a MIM number that is a phenotype, and a Gene."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/gene/README"
Node: dcid:geneOmimRelationshipType
name: "geneOmimRelationshipType"
typeOf: schema:Property
domainIncludes: dcs:GeneMendelianInheritanceInManIdentifierAssociation
rangeIncludes: dcs:GeneOmimRelationshipTypeEnum
description: "The type of relationship between the MIM number and the GeneID. The current values are 'gene' (the MIM number associated with a Gene, or a Gene that is assigned to a record where the molecular basis of the disease is not known) and 'phenotype' the MIM number associated with a disease that is associated with a gene."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/gene/README"
Node: dcid:geneOntologyCategory
name: "geneOntologyCategory"
typeOf: schema:Property
domainIncludes: dcs:GeneOntologyTerm
rangeIncludes: dcs:GeneOntologyCategoryEnum
description: "Indicates which of the three ontologies to which the Gene Ontology Term belongs: Biological Process (BP), Cellular Component (CC), or Molecular Function (MF)."
Node: dcid:geneOntologyEvidenceCode
name: "geneOntologyEvidenceCode"
typeOf: schema:Property
domainIncludes: dcs:GeneOntologyTerm
rangeIncludes: dcs:GOTermEvidenceCodeEnum
description: "The evidence code that is associated with a Gene Ontology (GO) term. This indicates the type of evidence supporting the association between the gene product and the GO term (e.g., experimental, computational, or other evidence)."
Node: dcid:geneOntologyId
name: "geneOntologyId"
typeOf: schema:Property
domainIncludes: dcs:GeneOntologyTerm
rangeIncludes: dcs:GOTermEvidenceCodeEnum
description: "Every term has a human-readable term name - e.g. mitochondrion, glucose transmembrane transport, or amino acid building - and a GO ID, a unique seven digit identifier prefixed by GO:, e.g. GO:0005739, GO:1904659, or GO:0016597."
descriptionUrl: "https://geneontology.org/docs/GO-term-elements"
Node: dcid:geneOrtholog
name: "geneOrtholog"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "Orthologs are genes in different specise taht can be traced back to the sam gene in the most recent common ancestor."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/gene/README"
Node: dcid:genePotentialReadthroughSibling
name: "genePotentialReadthroughSibling"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "A gene that is located close to another gene on the same DNA strand and might be transcribed together into a single RNA molecule due to the lack of a strong termination signal between them. Further analysis is needed to confirm if this readthrough actually occurs."
Node: dcid:geneReadthroughChild
name: "geneReadthroughChild"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "A gene that is formed when the transcription of an upstream gene (the 'parent') continues past its normal termination signal and into the downstream region, creating a longer RNA transcript that includes the sequence of the 'child' gene."
Node: dcid:geneReadthroughParent
name: "geneReadthroughParent"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "The upstream gene in a readthrough relationship. It is the gene whose transcription continues past its normal termination point, leading to the formation of a readthrough child gene."
Node: dcid:geneReadthroughSibling
name: "geneReadthroughSibling"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "Genes located on the same DNA strand that are transcribed together into a single RNA molecule due to the lack of a strong termination signal between them. This is confirmed to occur."
Node: dcid:geneRegionMember
name: "geneRegionMember"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "A gene located within a defined genomic region. This region might be associated with a specific function, regulatory element, or evolutionary history."
Node: dcid:geneRegionParent
name: "geneRegionParent"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: dcs:Gene
description: "A larger genomic region that encompasses multiple genes, including the 'region member'."
Node: dcid:geneReferenceIntoFunction
name: "geneReferenceIntoFunction"
typeOf: schema:Property
domainIncludes: dcs:GeneReferenceIntoFunction
rangeIncludes: schema:Text
description: "A short, specific summary of a gene's biological function, which is supported by citations from scientific literature."
Node: dcid:geneSymbol
name: "geneSymbol"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:Gene,dcs:GeneticVariant,dcs:GeneticAssociation,dcs:Protein
description: "Original gene symbol."
Node: dcid:geneticRepliconCount
name: "geneticRepliconCount"
typeOf: schema:Property
domainIncludes dcs:GenomeAssembly
rangeIncludes: schema:Number
description: "The total number of chromosomes, organelle genomes, and plasmids in the primary assembly."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/genomes/README_assembly_summary.txt"
Node: dcid:geneReviewsID
name: "geneReviewsID"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "GeneReviews, an international point-of-care resource for busy clinicians, provides clinically relevant and medically actionable information for inherited conditions in a standardized journal-style format, covering diagnosis, management, and genetic counseling for patients and their families. Each chapter in GeneReviews is written by one or more experts on the specific condition or disease and goes through a rigorous editing and peer review process before being published online."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/books/NBK1116/"
Node: dcid:geneticScaffoldCount
name: "geneticScaffoldCount"
typeOf: schema:Property
domainIncludes dcs:GenomeAssembly
rangeIncludes: schema:Number
description: "The number of scaffolds including placed, unlocalized, unplaced, alternate loci and patch scaffolds in the primary assembly."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/genomes/README_assembly_summary.txt"
Node: dcid:geneticsHomeReferenceID
name: "geneticsHomeReferenceID"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Genetics Home Reference (GHR) provides consumer-friendly information about the effects of genetic variation on human health."
descriptionUrl: "https://ghr.nlm.nih.gov/"
abbreviation: "GHR ID"
Node: dcid:geneticTestingRegistryID
name: "geneticTestingRegistryID"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "The Genetic Testing Registry (GTR) provides a central location for voluntary submission of genetic test information by providers. The scope includes the test's purpose, methodology, validity, evidence of the test's usefulness, and laboratory contacts and credentials. The overarching goal of the GTR is to advance the public health and research into the genetic basis of health and disease."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/gtr/"
abbreviation: "GTR ID"
Node: dcid:geneticVariantAlignmentQuality
name: "geneticVariantAlignmentQuality"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantAlignmentQualityEnum
domainIncludes: dcs:GeneticVariant
description: "The quality of the alignment: unique mapping, non-unique, and many matches (1, 2, or 3+)."
Node: dcid:geneticVariantAttribute
name: "geneticVariantAttribute"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantAttributeEnum
domainIncludes: dcs:GeneticVariant
description: "Genetic variant attributes extracted from dbSNP's SNP_bitfield table: clinically associated, MAF >5% in some populations, MAF >5% in all populations, has OMIM OMIA, microattribute tpa, submitted by locus-specific database, genotype conflict, rs cluster non-overlapping alleles, observed mismatch, pharmGKB, published, 3D structure, submitter link out, other variant with exact mapping, assembly specific,mutant, validated, included in high density kit, genotypes available, 1000 Genomes Phase 1, 1000 Genomes Phase 3, included in clinical diagnostic assay, withdrawn by some not all submitters, or common SNP."
Node: dcid:geneticVariantClass
name: "geneticVariantClass"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantClassEnum
domainIncludes: dcs:GeneticVariant
description: "Class of variant: single_nucleotide_variant, deletion, insertion, in-del, named, mixed, mnp, het, microsatellite, inversion, copy_number_loss, variation, duplication, or copy_number_gain."
Node: dcid:geneticVariantExceptions
name: "geneticVariantExceptions"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantExceptionEnum
domainIncludes: dcs:GeneticVariant
description: "Unusual conditions noted by UCSC that may indicate a problem with the data."
Node: dcid:geneticVariantFunctionalCategory
name: "geneticVariantFunctionalCategory"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantFunctionalCategoryEnum
domainIncludes: dcs:GeneticVariant
description: "Functional category of the genetic variant (coding-synon, splice_5', missense, frameshift, near_gene_5', 3'_UTR, near_gene_3', nonsense, splice_3', intron, cds_reference, 5'_UTR, unknown, cds_indel, stop_loss, 5' UTR, or ncRNA.)"
Node: dcid:geneticVariantID
name: "geneticVariantID"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariant
domainIncludes: dcs:GeneGeneticVariantAssociation
description: "Link out to GeneticVariant node associated with the current node."
Node: dcid:geneticVariantImpercise
name: "geneticVariantImpercise"
typeOf: schema:Property
rangeIncludes: schema:Boolean
domainIncludes: dcs:GeneticVariant
description: "Boolean of whether a variant is flagged as an imprecise structural variation."
Node: dcid:geneticVariantLength
name: "geneticVariantLength"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Difference in length between REF and ALT alleles (bp)."
Node: dcid:geneticVariantLocType
name: "geneticVariantLocType"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantLocTypeEnum
domainIncludes: dcs:GeneticVariant
description: "Type of mapping inferred from size on reference; may not agree with class."
Node: dcid:geneticVariantSubmitterCount
name: "geneticVariantSubmitterCount"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Number of distinct submitter handles for submitted SNPs for this ref SNP."
Node: dcid:geneticVariantValidationStatus
name: "geneticVariantValidationStatus"
typeOf: schema:Property
rangeIncludes: dcs:GeneticVariantValidationStatusEnum
domainIncludes: dcs:GeneticVariant
description: "Validation status of the SNP."
Node: dcid:genomeAnnotatedBy
name: "genomeAnnotatedBy"
typeOf: schema:Property
domainIncludes: dcs:GenomeAssembly
rangeIncludes: dcs:Lab,schema:Person,schema:Text
description: "The group that described the structure and identified functional elements of a genome sequence thereby by providing biological significance."
Node: dcid:genomeAssemblyDerivedFrom
name: "genomeAssemblyDerivedFrom"
typeOf: schema:Property
domainIncludes: dcs:GenomeAssembly
rangeIncludes: schema:Boolean
description: "Denotes the relation of the genome assembly with the type material from which it was derived."
Node: dcid:genomeAssemblyType
name: "genomeAssemblyType"
typeOf: schema:Property
rangeIncludes: dcs:GenomeAssemblyTypeEnum
domainIncludes: dcs:GenomeAssembly
description: "The type of sequence model data defined in this genome assembly."
Node: dcid:genomeAssemblyLevel
name: "genomeAssemblyLevel"
typeOf: schema:Property
rangeIncludes: dcs:GenomeAssemblyLevelEnum
domainIncludes: dcs:GenomeAssembly
description: "The highest level of assembly for any object in the assembly."
descriptionUrl: "https://www.ncbi.nlm.nih.gov/assembly/help/#level"
Node: dcid:genomeAssemblyReleaseType
name: "genomeAssemblyReleaseType"
typeOf: schema:Property
rangeIncludes: dcs:GenomeAssemblyReleaseTypeEnum
domainIncludes: dcs:GenomeAssembly
description: "Defines the update type of this genome assembly version release."
Node: dcid:genomeAssemblyYear
name: "genomeAssemblyYear"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GenomeAssembly
description: "The year in which the genome assembly was released."
Node: dcid:genomeCoverage
name: "genomeCoverage"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GenomeAssembly
description: "Genome coverage is the coverage depth of a sequencing run. This is calculated as the number of bases of all short reads that match a genome divided by the length of this genome, which represents the average number of times a base of a genome is sequenced."
Node: dcid:genomeReferenceConsortiumAssemblyName
name: "genomeReferenceConsortiumAssemblyName"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GenomeAssembly
description: "The Genome Refrence Consortium name for the genome assembly."
abbreviation: "GRC assembly name"
Node: dcid:genomeSize
name: "genomeSize"
typeOf: schema:Property
domainIncludes: dcs:GenomeAssembly
rangeIncludes: schema:Quantity
description: "Total length of all top-level sequences in the primary assembly."
Node: dcid:genomeSizeUngapped
name: "genomeSizeUngapped"
typeOf: schema:Property
domainIncludes: dcs:GenomeAssembly
rangeIncludes: schema:Quantity
description: "Total length of all top-level sequences in the primary assembly ignoring gaps. Any stretch of 10 or more Ns in asequence is treated like a gap."
descriptionUrl: "https://ftp.ncbi.nlm.nih.gov/genomes/README_assembly_summary.txt"
Node: dcid:genomicCoordinates
name: "genomicCoordinates"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:Gene
description: "Start position (0 based). End position (non-inclusive). Represents the genomic coordinates of an object of interest."
Node: dcid:genomicPosition
name: "genomicPosition"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:Nucleotide,dcs:GeneticVariant
description: "The genomic position of the nucleotide."
Node: dcid:gtexID
name: "gtexID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneGeneticVariantAssociation
description: "An ID denoting a unique gene and genetic variant association within the GTEx database."
Node: dcid:hasGeneticVariantAnnotation
name: "hasGeneticVariantAnnotation"
typeOf: schema:Property
domainIncludes: dcs:Gene
rangeIncludes: schema:Boolean
description: "Indicates whether there are gene has genetic variants that are associated with it."
Node: dcid:hasGenomicCoordinates
name: "hasGenomicCoordinates"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: dcs:GenomicCoordinates
description: "Genomic coordinates specify the location of the position of an element within a defined DNA contig. It is a specified set of chromosome start_position end_position within a specified genome assembly."
Node: dcid:hasGenomicPosition
name: "hasGenomicPosition"
typeOf: schema:Property
domainIncludes: dcs:GenomeAnnotation
rangeIncludes: dcs:GenomicPosition
description: "Genomic position specify the precise nucleotide location within a defined DNA contig. It is a specified set of chromosome and position within a specified genome assembly."
Node: dcid:hgncID
name: "hgncID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:Gene
description: "HUGO Gene Nomenclature Committee identifier."
synonym: "HUGO Gene Nomenclature Committee ID"
Node: dcid:hg38DistanceFromTranscriptionStartSite
name: "hg38DistanceFromTranscriptionStartSite"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneGeneticVariantAssociation
description: "In the hg38 genome assembly, the distance in base pairs between the associated genetic variant and gene."
abbreviation: "hg38 distance from TSS"
Node: dcid:hg19DistanceFromTranscriptionStartSite
name: "hg19DistanceFromTranscriptionStartSite"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneGeneticVariantAssociation
description: "In the hg19 genome assembly, the distance in base pairs between the associated genetic variant and gene."
abbreviation: "hg19 distance from TSS"
Node: dcid:humanGenomeVariationSocietyNomenclature
name: "humanGenomeVariationSocietyNomenclature"
typeOf: schema:Property
rangeIncludes: schema:Number
domainIncludes: dcs:GeneticVariant
description: "Variant names from the Human Genome Variation Society"
descriptionUrl: "https://varnomen.hgvs.org/"
Node: dcid:humanPhenotypeOntologyID
name: "humanPhenotypeOntologyID"
typeOf: schema:Property
rangeIncludes: schema:Text
domainIncludes: dcs:GeneticVariant
description: "The Human Phenotype Ontology (HPO)"
descriptionUrl: "https://hpo.jax.org/app/"
Node: dcid:inChromosome
name: "inChromosome"
typeOf: schema:Property
rangeIncludes: dcs:Chromosome,schema:Text
domainIncludes: dcs:GenomeAnnotation,dcs:Chromosome
description: "A threadlike structure of nucleic acids and protein found in the nucleus of most living cells, carrying genetic information in the form of genes."