-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathdefault_variant_annotations_schema.yaml
144 lines (144 loc) · 4.45 KB
/
default_variant_annotations_schema.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
openapi: 3.0.2
servers: []
info:
version: "draft.3"
title: GA4GH Beacon Variant Annotation Default Schema
description: >-
Schema for variant annotations to be used as default by the Beacon.
contact:
email: [email protected]
license:
name: Apache 2.0
url: 'http://www.apache.org/licenses/LICENSE-2.0.html'
externalDocs:
description: |
Beacon Project
url: 'http://beacon-project.io/'
paths: {}
components:
schemas:
GenomicFeature:
description: |
Genomic feature(s) affected by the variant
type: object
properties:
class:
description: |
Class of genomic region affected by the variant
type: string
enum:
- gene
- protein coding transcript
- untranslated region
- non-coding transcript
example: "gene"
featureID:
description: |
ID /accession/name of genomic region affected by the variant, matching class in `class`
type: string
example:
- 'TP53'
- 'GeneID:43740578'
VariantAnnotation:
description: TBD # TBD
type: object
properties:
variantId:
description: |
Reference to Variant ID.
type: string
variantAlternativeId:
description: |
List of cross-referencing ID(s) (CURIE(s)) for the variant in the original
databases or variant-level (aggregated) databases for previously described
variants (e.g. clinVarId, ClinGen, COSMIC), e.g. "VCV000055583.1", "CA003602".
type: array
items:
type: string
example:
- 'rs80356868'
- 'CA003602'
- 'VCV000055583.1'
genomicHGVSId:
description: |
HGVSId descriptor at genomic level, referred to genome assembly
defined in Variant Identification.
type: string
example: 'NC_000011.9:g.134086816T>C'
transcriptHGVSId:
description: |
List of HGVSId descriptor(s) at transcript level.
type: array
items:
type: string
example:
- 'NC 000023.10(NM004006.2):c.357+1G'
proteinHGVSIds:
description: |
List of HGVSId descriptor(s) at protein level (for protein-altering
variants).
type: array
items:
type: string
example:
- 'NP_009225.1:p.Glu1817Ter'
- 'LRG 199p1:p.Val25Gly (preferred)'
genomicRegions:
description: |
List of classification(s) of the variant according to the genomic
region affected (all that apply, relative to each feature affected). Value from Ensembl
Glossary (ENSGLOSS)
type: array
items:
type: string
example:
- 'intergenic'
- '5UTR'
- '3UTR'
- 'coding'
genomicFeatures:
description: |
List of Genomic feature(s) affected by the variant.
type: array
items:
$ref: '#/components/schemas/GenomicFeature'
annotationToolVersion:
description: |
Tool used for annotation and prediction of variant effects
type: string
example: 'SnpEffVersion=4.3t (build 2017-11-24 1018)'
molecularEffect:
description: |
List of predicted effect at nucleotide level
type: array
items:
type: string
example:
- 'STOP_GAINED'
molecularConsequence:
description: |
List of Predicted effect at protein level for protein affecting variants (Ontology label)
type: array
items:
type: string
example:
- 'nonsense'
- 'missense'
aminoacidChange:
description: |
Lisf of change(s) at aminoacid level for protein affecting variants
type: array
items:
type: string
example:
- 'V304*'
info:
description: |
Additional unspecified metadata about the dataset response or its
content.
type: object
example:
additionalInfoKey1:
- additionalInfoValue1
- additionalInfoValue2
additionalInfoKey2: additionalInfoValue