-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathgenomic_data.yaml
More file actions
271 lines (269 loc) · 8.09 KB
/
genomic_data.yaml
File metadata and controls
271 lines (269 loc) · 8.09 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
# this is an example of the OncoBlocks API
# as a demonstration of an API spec in YAML
swagger: '2.0'
info:
title: OncoBlocks API
description: OncoBlocks Open Cancer Genomics API.
version: "1.0.0"
# the domain of the service
host: api.oncoblocks.org
# array of all schemes that your API supports
schemes:
- https
# will be prefixed to all paths
basePath: /v1
produces:
- application/json
paths:
/signal:
get:
summary: Get discrete or continuous signal data.
description: Get discrete or continuous signal data, such as expression data, phosphoproteomic data or discretized copy number data.
parameters:
- name: sample_id
in: query
description: Samples ID(s).
required: false
type: array
items:
type: string
- name: entrez_gene_id
in: query
description: Entrez Gene ID(s).
required: false
type: array
items:
type: integer
- name: genome_coordinate
in: query
description: Genome coordinate(s), of the form chr:start-end.
required: false
type: array
items:
type: string
- name: study_id
in: query
description: Study ID(s).
required: false
type: string
- name: data_set_id
in: query
description: Data set ID.
required: true
type: string
responses:
200:
description: an array of signal objects.
schema:
title: Signals
type: array
items:
$ref: SignalData
/copy_number_regions:
get:
summary: Get copy number regions of interest.
description: Get copy number regions of interest, e.g. statistically significant regions of amplification or deletion identified by the GISTIC algorithm.
parameters:
- name: study_id
in: query
description: Study ID.
required: true
type: string
- name: data_set_id
in: query
description: Data Set ID.
required: true
type: string
responses:
200:
description: an array of copy number region objects.
schema:
title: RegionsOfInterest
type: array
items:
$ref: RegionOfInterest
/mutations:
get:
summary: Get mutation data.
description: Retrieves mutation data by mutation properties, sample, or gene.
parameters:
- name: sample_id
in: query
description: Samples ID(s).
required: false
type: array
items:
type: string
- name: entrez_gene_id
in: query
description: Entrez Gene ID(s).
required: false
type: array
items:
type: integer
- name: study_id
in: query
description: Study ID(s).
required: false
type: array
items:
type: string
- name: data_set_id
in: query
description: Data set ID.
required: false
type: array
items:
type: integer
- name: variant_classification
in: query
description: Mutation type(s).
required: false
type: array
items:
type: string
responses:
200:
description: an array of mutation data objects.
schema:
title: MutationData
type: array
items:
$ref: MutationData
definitions:
SignalData:
properties:
stable_sample_id:
type: integer
format: int32
description: Sample ID.
gene_id:
type: integer
format: int32
description: Entrez gene ID.
gene_symbol:
type: string
description: Official gene symbol.
genome_coordinates:
type: string
description: Genomic coordinates.
signal_value:
type: number
description: Signal intensity.
annotation_list:
description: Curated annotations regarding the signal or event.
type: array
items:
type: string
RegionOfInterest:
properties:
cytoband:
type: string
description: Cytoband.
q_value:
type: number
description: Q-Value.
residual_q_value:
type: number
description: Residual Q-Value.
wide_peak_boundaries:
type: string
description: Wide peak boundaries.
entrez_gene_list:
type: array
items:
type: integer
format: int32
MutationData:
properties:
stable_sample_id:
type: integer
format: int32
description: Sample ID.
gene_id:
type: integer
format: int32
description: Entrez gene ID.
gene_symbol:
type: string
description: Official gene symbol.
reference_genome:
type: string
description: Reference genome to which the DNA coordinates are aligned.
chromosome:
type: string
description: Chromosome in which the mutation is located.
dna_start_position:
type: integer
format: int32
description: Start position of the mutation in genomic DNA.
dna_end_position:
type: integer
format: int32
description: End position of the mutation in genomic DNA.
strand:
type: string
description: Chromosome strand in which the mutation is located.
variant_classification:
type: string
description: Specific category of mutation.
variant_type:
type: string
description: General category of mutation.
reference_allele:
type: string
description: Nucleotides of the reference DNA sequence.
variant_allele:
type: string
description: Nucelotides of the mutated DNA sequence.
alternative_allele_reads:
type: integer
format: int32
description: Number of reads supporting the mutant allele.
reference_allele_reads:
type: integer
format: int32
description: Number of reads supporting the wild type allele.
dbsnp_rsid:
type: string
description: dbSNP RS ID of the record of the mutation.
annotation_transcript:
type: string
description: Database ID of the cDNA transcript to which the cDNA coordinates are aligned.
transcript_strand:
type: string
description: Strand in the reference transcript to which the mutation coordinates are aligned.
cdna_change:
type: string
description: Change in he cDNA sequence.
codon_change:
type: string
description: Change in the cDNA sequence in the context of the codon.
protein_change:
type: string
description: Change in the amino acid sequence.
other_transcripts:
type: string
description: Delimited list of additional transcripts and amino acid changes associated with the genomic DNA mutation.
refseq_mrna_id:
type: string
description: ID of the RefSeq mRNA transcript for the mutated gene.
refseq_prot_id:
type: string
description: ID of the RefSeq amino acid transcript for the mutated protein.
swissprot_accession:
type: string
description: ID of the Swissprot amino acid transcript for the mutated protein.
swissprot_entry:
type: string
description: ID of the Swissprot gene record.
uniprot_aa_position:
type: integer
format: int32
description: Mutation position in the Uniprot amino acid transcript.
uniprot_region:
type: string
description: Protein region in which the mutation occurs in the Uniprot transcript.
uniprot_site:
type: string
description: Protein site in which the mutation occurs in the Uniprot transcript.