publisci 0.1.3 → 0.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,54 +1,54 @@
1
1
  module PubliSci
2
- module Readers
3
- class RMatrix
4
- include PubliSci::Dataset::DataCube
2
+ module Readers
3
+ class RMatrix
4
+ include PubliSci::Dataset::DataCube
5
5
 
6
- #NOTE; this is pretty much hard coded for Karl's application right now, and doesn't
7
- # do any dimension or code generation. Since its a set of LOD scores indexed by dimension
8
- # and marker the usual datacube generator wont work (I think). In the future adding an option
9
- # to specify this kind of a dataset would probably be useful
6
+ #NOTE; this is pretty much hard coded for Karl's application right now, and doesn't
7
+ # do any dimension or code generation. Since its a set of LOD scores indexed by dimension
8
+ # and marker the usual datacube generator wont work (I think). In the future adding an option
9
+ # to specify this kind of a dataset would probably be useful
10
10
 
11
11
 
12
- def generate_n3(client, var, outfile_base, options={})
13
- meas = measures(client,var,options)
14
- dim = dimensions(client,var,options)
15
- codes = codes(client,var,options)
12
+ def generate_n3(client, var, outfile_base, options={})
13
+ meas = measures(client,var,options)
14
+ dim = dimensions(client,var,options)
15
+ codes = codes(client,var,options)
16
16
 
17
- outvar = sanitize([var]).first
17
+ outvar = sanitize([var]).first
18
18
 
19
- probes_per_file = options[:probes_per_file] || 100
20
- col_select = "colnames"
21
- col_select = "names" if options[:type] == :dataframe
19
+ probes_per_file = options[:probes_per_file] || 100
20
+ col_select = "colnames"
21
+ col_select = "names" if options[:type] == :dataframe
22
22
 
23
- #write structure
24
- open(outfile_base+'_structure.ttl','w'){|f| f.write structure(client,var,outvar,options)}
23
+ #write structure
24
+ open(outfile_base+'_structure.ttl','w'){|f| f.write structure(client,var,outvar,options)}
25
25
 
26
- probes=client.eval("#{col_select}(#{var})").to_ruby
27
- if probes == nil
28
- client.eval("colnames(#{var})=1:ncol(#{var})")
29
- probes=client.eval("#{col_select}(#{var})").to_ruby
30
- end
31
- markers = rows(client,var,options)
26
+ probes=client.eval("#{col_select}(#{var})").to_ruby
27
+ if probes == nil
28
+ client.eval("colnames(#{var})=1:ncol(#{var})")
29
+ probes=client.eval("#{col_select}(#{var})").to_ruby
30
+ end
31
+ markers = rows(client,var,options)
32
32
 
33
33
  if options[:print]
34
- puts prefixes(var,options)
34
+ puts prefixes(var,options)
35
35
  end
36
36
 
37
37
  if options[:output] == :string
38
- str = prefixes(var,options)
38
+ str = prefixes(var,options)
39
39
  end
40
40
 
41
- probes.each_with_index{|probe,i|
42
- #write prefixes and erase old file on first run
41
+ probes.each_with_index{|probe,i|
42
+ #write prefixes and erase old file on first run
43
43
  unless options[:print] || options[:output] == :string
44
- open(outfile_base+"_#{i/probes_per_file}.ttl",'w'){|f| f.write prefixes(var,options)} if i % probes_per_file == 0
44
+ open(outfile_base+"_#{i/probes_per_file}.ttl",'w'){|f| f.write prefixes(var,options)} if i % probes_per_file == 0
45
45
  end
46
- i+=1
47
- obs_data = observation_data(client,var,i,markers,options)
48
- labels = labels_for(client,var,probe)
46
+ i+=1
47
+ obs_data = observation_data(client,var,i,markers,options)
48
+ labels = labels_for(client,var,probe)
49
49
 
50
- # labels = sanitize(labels)
51
- # return obs_data
50
+ # labels = sanitize(labels)
51
+ # return obs_data
52
52
  if options[:print]
53
53
  observations(meas,dim,codes,obs_data,labels,outvar,options).each{|obs| puts obs}
54
54
  end
@@ -58,119 +58,119 @@ module PubliSci
58
58
  end
59
59
 
60
60
  unless options[:print] || options[:output] == :string
61
- open(outfile_base+"_#{i/probes_per_file}.ttl",'a'){|f| observations(meas,dim,codes,obs_data,labels,outvar,options).map{|obs| f.write obs}}
62
- puts "#{i}/#{probes.size}" unless options[:quiet]
61
+ open(outfile_base+"_#{i/probes_per_file}.ttl",'a'){|f| observations(meas,dim,codes,obs_data,labels,outvar,options).map{|obs| f.write obs}}
62
+ puts "#{i}/#{probes.size}" unless options[:quiet]
63
63
  end
64
- }
64
+ }
65
65
 
66
66
  if options[:output] == :string
67
67
  str
68
68
  end
69
- end
70
-
71
- def structure(client,var,outvar,options={})
72
- meas = measures(client,var,options)
73
- dim = dimensions(client,var,options)
74
- codes = codes(client,var,options)
75
-
76
- str = prefixes(var, options)
77
- str << data_structure_definition(meas,[],codes,outvar,options)
78
- str << dataset(outvar,options)
79
- component_specifications(meas, dim, codes, var, options).map{ |c| str << c }
80
- measure_properties(meas,var,options).map{|m| str << m}
81
-
82
- str
83
- end
84
-
85
- #for now just make everything a measure
86
- def measures(client, var, options={})
87
- if options[:measures]
88
- options[:measures]
89
- else
90
- ["probe","marker","value"]
91
- end
92
- # measure_properties(measures,var,options)
93
- end
94
-
95
- def dimensions(client, var, options={})
96
- # dimension_properties([""],var)
97
- []
98
- end
99
-
100
- def codes(client, var, options={})
101
- []
102
- end
103
-
104
- def labels_for(connection,var,probe_id,options={})
105
- row_names = connection.eval("row.names(#{var})")
106
- # row_names = (1..@rexp.payload.first.to_ruby.size).to_a unless row_names.first
107
- if row_names == connection.eval('NULL')
108
- row_names = (1..connection.eval("nrow(#{var})").payload.first).to_a
109
- else
110
- row_names = row_names.payload
111
- end
112
-
113
- labels = (1..(row_names.size)).to_a.map(&:to_s)
114
- labels = labels.map{|l|
115
- l.insert(0,probe_id.to_s + "_")
116
- }
117
-
118
- labels
119
- end
120
-
121
- def rows(connection,var,options={})
122
- row_names = connection.eval("row.names(#{var})")
123
- #hacky solution because rserve client's .to_ruby method doesn't fully work
124
- if row_names == connection.eval('NULL')
125
- row_names = (1..connection.eval("nrow(#{var})").payload.first).to_a
126
- else
127
- row_names = row_names.payload
128
- end
129
- row_names
130
- end
131
-
132
- def observation_data(client, var, probe_number, row_names, options={})
133
-
134
- data = {}
135
- # geno_chr = client.eval("#{var}$geno$'#{chr}'")
136
- # n_individuals = client.eval("#{var}$pheno[[1]]").to_ruby.size
137
- # entries_per_individual = @rexp.payload["geno"].payload[row_individ].payload["map"].payload.size * @rexp.payload["geno"].payload.names.size
138
- col_label = "probe"
139
- row_label = "marker"
140
- val_label = "value"
141
-
142
- if options[:measures]
143
- col_label = options[:measures][0] || "probe"
144
- row_label = options[:measures][1] || "marker"
145
- val_label = options[:measures][2] || "value"
146
- end
147
-
148
- data["#{col_label}"] = []
149
- data["#{row_label}"] = []
150
- data["#{val_label}"] = []
151
-
152
- # n_individuals.times{|row_individ|
153
- # puts "#{row_individ}/#{n_individuals}"
154
-
155
- col_select = "colnames"
156
- col_select = "names" if options[:type] == :dataframe
157
-
158
- if options[:type] == :dataframe
159
- probe_obj = client.eval("#{var}[[#{probe_number}]]").to_ruby
160
- else
161
- probe_obj = client.eval("#{var}[,#{probe_number}]").to_ruby
162
- end
163
- # puts probe_obj
164
- probe_id = client.eval("#{col_select}(#{var})[[#{probe_number}]]").to_ruby
165
- data["#{col_label}"] = (1..(probe_obj.size)).to_a.fill(probe_id)
166
- probe_obj.each_with_index{|lod,i|
167
- data["#{row_label}"] << row_names[i]
168
- data["#{val_label}"] << lod
169
- }
170
-
171
- data.map{|k,v| v.flatten!}
172
- data
173
- end
174
- end
175
- end
69
+ end
70
+
71
+ def structure(client,var,outvar,options={})
72
+ meas = measures(client,var,options)
73
+ dim = dimensions(client,var,options)
74
+ codes = codes(client,var,options)
75
+
76
+ str = prefixes(var, options)
77
+ str << data_structure_definition(meas,[],codes,outvar,options)
78
+ str << dataset(outvar,options)
79
+ component_specifications(meas, dim, codes, var, options).map{ |c| str << c }
80
+ measure_properties(meas,var,options).map{|m| str << m}
81
+
82
+ str
83
+ end
84
+
85
+ #for now just make everything a measure
86
+ def measures(client, var, options={})
87
+ if options[:measures]
88
+ options[:measures]
89
+ else
90
+ ["probe","marker","value"]
91
+ end
92
+ # measure_properties(measures,var,options)
93
+ end
94
+
95
+ def dimensions(client, var, options={})
96
+ # dimension_properties([""],var)
97
+ []
98
+ end
99
+
100
+ def codes(client, var, options={})
101
+ []
102
+ end
103
+
104
+ def labels_for(connection,var,probe_id,options={})
105
+ row_names = connection.eval("row.names(#{var})")
106
+ # row_names = (1..@rexp.payload.first.to_ruby.size).to_a unless row_names.first
107
+ if row_names == connection.eval('NULL')
108
+ row_names = (1..connection.eval("nrow(#{var})").payload.first).to_a
109
+ else
110
+ row_names = row_names.payload
111
+ end
112
+
113
+ labels = (1..(row_names.size)).to_a.map(&:to_s)
114
+ labels = labels.map{|l|
115
+ l.insert(0,probe_id.to_s + "_")
116
+ }
117
+
118
+ labels
119
+ end
120
+
121
+ def rows(connection,var,options={})
122
+ row_names = connection.eval("row.names(#{var})")
123
+ #hacky solution because rserve client's .to_ruby method doesn't fully work
124
+ if row_names == connection.eval('NULL')
125
+ row_names = (1..connection.eval("nrow(#{var})").payload.first).to_a
126
+ else
127
+ row_names = row_names.payload
128
+ end
129
+ row_names
130
+ end
131
+
132
+ def observation_data(client, var, probe_number, row_names, options={})
133
+
134
+ data = {}
135
+ # geno_chr = client.eval("#{var}$geno$'#{chr}'")
136
+ # n_individuals = client.eval("#{var}$pheno[[1]]").to_ruby.size
137
+ # entries_per_individual = @rexp.payload["geno"].payload[row_individ].payload["map"].payload.size * @rexp.payload["geno"].payload.names.size
138
+ col_label = "probe"
139
+ row_label = "marker"
140
+ val_label = "value"
141
+
142
+ if options[:measures]
143
+ col_label = options[:measures][0] || "probe"
144
+ row_label = options[:measures][1] || "marker"
145
+ val_label = options[:measures][2] || "value"
146
+ end
147
+
148
+ data["#{col_label}"] = []
149
+ data["#{row_label}"] = []
150
+ data["#{val_label}"] = []
151
+
152
+ # n_individuals.times{|row_individ|
153
+ # puts "#{row_individ}/#{n_individuals}"
154
+
155
+ col_select = "colnames"
156
+ col_select = "names" if options[:type] == :dataframe
157
+
158
+ if options[:type] == :dataframe
159
+ probe_obj = client.eval("#{var}[[#{probe_number}]]").to_ruby
160
+ else
161
+ probe_obj = client.eval("#{var}[,#{probe_number}]").to_ruby
162
+ end
163
+ # puts probe_obj
164
+ probe_id = client.eval("#{col_select}(#{var})[[#{probe_number}]]").to_ruby
165
+ data["#{col_label}"] = (1..(probe_obj.size)).to_a.fill(probe_id)
166
+ probe_obj.each_with_index{|lod,i|
167
+ data["#{row_label}"] << row_names[i]
168
+ data["#{val_label}"] << lod
169
+ }
170
+
171
+ data.map{|k,v| v.flatten!}
172
+ data
173
+ end
174
+ end
175
+ end
176
176
  end
@@ -2,7 +2,7 @@ module PubliSci
2
2
  module Writers
3
3
  class ARFF < Base
4
4
  # include PubliSci::Query
5
- # include PubliSci::Parser
5
+ # include PubliSci::RDFParser
6
6
  # include PubliSci::Analyzer
7
7
 
8
8
  def build_arff(relation, attributes, data, source)
@@ -2,7 +2,7 @@ module PubliSci
2
2
  module Writers
3
3
  class Base
4
4
  include PubliSci::Query
5
- include PubliSci::Parser
5
+ include PubliSci::RDFParser
6
6
  include PubliSci::Analyzer
7
7
 
8
8
  def handle_input(input)
@@ -1,20 +1,20 @@
1
- @base <http://onto.strinz.me/dc/dataset/maf_example/> .
2
- @prefix ns: <http://onto.strinz.me/dc/dataset/maf_example/> .
1
+ @base <http://onto.strinz.me/dc/dataset/MAF_ah1iit/> .
2
+ @prefix ns: <http://onto.strinz.me/dc/dataset/MAF_ah1iit/> .
3
3
  @prefix qb: <http://purl.org/linked-data/cube#> .
4
4
  @prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
5
5
  @prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
6
6
  @prefix prop: <http://onto.strinz.me/properties/> .
7
7
  @prefix dct: <http://purl.org/dc/terms/> .
8
8
  @prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
9
- @prefix cs: <http://onto.strinz.me/dc/dataset/maf_example/cs/> .
10
- @prefix code: <http://onto.strinz.me/dc/dataset/maf_example/code/> .
9
+ @prefix cs: <http://onto.strinz.me/dc/dataset/MAF_ah1iit/cs/> .
10
+ @prefix code: <http://onto.strinz.me/dc/dataset/MAF_ah1iit/code/> .
11
11
  @prefix owl: <http://www.w3.org/2002/07/owl#> .
12
12
  @prefix skos: <http://www.w3.org/2004/02/skos/core#> .
13
13
  @prefix foaf: <http://xmlns.com/foaf/0.1/> .
14
14
  @prefix org: <http://www.w3.org/ns/org#> .
15
15
  @prefix prov: <http://www.w3.org/ns/prov#> .
16
16
 
17
- ns:dsd-maf_example a qb:DataStructureDefinition;
17
+ ns:dsd-MAF_ah1iit a qb:DataStructureDefinition;
18
18
  qb:component cs:Variant_Classification ;
19
19
  qb:component cs:Variant_Type ;
20
20
  qb:component cs:dbSNP_Val_Status ;
@@ -52,9 +52,9 @@ ns:dsd-maf_example a qb:DataStructureDefinition;
52
52
  qb:component cs:patient_id ;
53
53
  qb:component cs:sample_id .
54
54
 
55
- ns:dataset-maf_example a qb:DataSet ;
56
- rdfs:label "maf_example"@en ;
57
- qb:structure ns:dsd-maf_example .
55
+ ns:dataset-MAF_ah1iit a qb:DataSet ;
56
+ rdfs:label "MAF_ah1iit"@en ;
57
+ qb:structure ns:dsd-MAF_ah1iit .
58
58
 
59
59
  cs:Variant_Classification a qb:ComponentSpecification ;
60
60
  rdfs:label "Variant_Classification" ;
@@ -207,16 +207,13 @@ prop:Entrez_Gene_Id a rdf:Property, qb:MeasureProperty ;
207
207
  rdfs:label "Entrez_Gene_Id"@en .
208
208
 
209
209
  prop:Center a rdf:Property, qb:MeasureProperty ;
210
- rdfs:label "Center"@en ;
211
- rdfs:range xsd:string .
210
+ rdfs:label "Center"@en .
212
211
 
213
212
  prop:NCBI_Build a rdf:Property, qb:MeasureProperty ;
214
- rdfs:label "NCBI_Build"@en ;
215
- rdfs:range xsd:int .
213
+ rdfs:label "NCBI_Build"@en .
216
214
 
217
215
  prop:Chromosome a rdf:Property, qb:MeasureProperty ;
218
- rdfs:label "Chromosome"@en ;
219
- rdfs:range xsd:int .
216
+ rdfs:label "Chromosome"@en .
220
217
 
221
218
  prop:Start_Position a rdf:Property, qb:MeasureProperty ;
222
219
  rdfs:label "Start_Position"@en .
@@ -240,8 +237,7 @@ prop:dbSNP_RS a rdf:Property, qb:MeasureProperty ;
240
237
  rdfs:label "dbSNP_RS"@en .
241
238
 
242
239
  prop:Tumor_Sample_Barcode a rdf:Property, qb:MeasureProperty ;
243
- rdfs:label "Tumor_Sample_Barcode"@en ;
244
- rdfs:range xsd:string .
240
+ rdfs:label "Tumor_Sample_Barcode"@en .
245
241
 
246
242
  prop:Matched_Norm_Sample_Barcode a rdf:Property, qb:MeasureProperty ;
247
243
  rdfs:label "Matched_Norm_Sample_Barcode"@en .
@@ -955,7 +951,7 @@ code:sequencer a skos:ConceptScheme;
955
951
  skos:inScheme code:sequencer .
956
952
 
957
953
  ns:obs2 a qb:Observation ;
958
- qb:dataSet ns:dataset-maf_example ;
954
+ qb:dataSet ns:dataset-MAF_ah1iit ;
959
955
  prop:Variant_Classification <code/variant_classification/Missense_Mutation> ;
960
956
  prop:Variant_Type <code/variant_type/SNP> ;
961
957
  prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
@@ -990,7 +986,7 @@ ns:obs2 a qb:Observation ;
990
986
  .
991
987
 
992
988
  ns:obs3 a qb:Observation ;
993
- qb:dataSet ns:dataset-maf_example ;
989
+ qb:dataSet ns:dataset-MAF_ah1iit ;
994
990
  prop:Variant_Classification <code/variant_classification/Missense_Mutation> ;
995
991
  prop:Variant_Type <code/variant_type/SNP> ;
996
992
  prop:dbSNP_Val_Status <code/dbsnp_val_status/byFrequency> ;
@@ -1025,7 +1021,7 @@ ns:obs3 a qb:Observation ;
1025
1021
  .
1026
1022
 
1027
1023
  ns:obs4 a qb:Observation ;
1028
- qb:dataSet ns:dataset-maf_example ;
1024
+ qb:dataSet ns:dataset-MAF_ah1iit ;
1029
1025
  prop:Variant_Classification <code/variant_classification/Missense_Mutation> ;
1030
1026
  prop:Variant_Type <code/variant_type/SNP> ;
1031
1027
  prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
@@ -1061,7 +1057,7 @@ ns:obs4 a qb:Observation ;
1061
1057
  .
1062
1058
 
1063
1059
  ns:obs5 a qb:Observation ;
1064
- qb:dataSet ns:dataset-maf_example ;
1060
+ qb:dataSet ns:dataset-MAF_ah1iit ;
1065
1061
  prop:Variant_Classification <code/variant_classification/Silent> ;
1066
1062
  prop:Variant_Type <code/variant_type/SNP> ;
1067
1063
  prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
@@ -1097,7 +1093,7 @@ ns:obs5 a qb:Observation ;
1097
1093
  .
1098
1094
 
1099
1095
  ns:obs6 a qb:Observation ;
1100
- qb:dataSet ns:dataset-maf_example ;
1096
+ qb:dataSet ns:dataset-MAF_ah1iit ;
1101
1097
  prop:Variant_Classification <code/variant_classification/Silent> ;
1102
1098
  prop:Variant_Type <code/variant_type/SNP> ;
1103
1099
  prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
@@ -1132,7 +1128,7 @@ ns:obs6 a qb:Observation ;
1132
1128
  .
1133
1129
 
1134
1130
  ns:obs7 a qb:Observation ;
1135
- qb:dataSet ns:dataset-maf_example ;
1131
+ qb:dataSet ns:dataset-MAF_ah1iit ;
1136
1132
  prop:Variant_Classification <code/variant_classification/Missense_Mutation> ;
1137
1133
  prop:Variant_Type <code/variant_type/SNP> ;
1138
1134
  prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
@@ -1171,3 +1167,83 @@ ns:obs7 a qb:Observation ;
1171
1167
  prop:sample_id "01A-11D-A14G-09" ;
1172
1168
  .
1173
1169
 
1170
+ ns:obs8 a qb:Observation ;
1171
+ qb:dataSet ns:dataset-MAF_ah1iit ;
1172
+ prop:Variant_Classification <code/variant_classification/Silent> ;
1173
+ prop:Variant_Type <code/variant_type/SNP> ;
1174
+ prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
1175
+ prop:Verification_Status <code/verification_status/Unknown> ;
1176
+ prop:Validation_Status <code/validation_status/Valid> ;
1177
+ prop:Mutation_Status <code/mutation_status/Somatic> ;
1178
+ prop:Sequence_Source <code/sequence_source/WXS> ;
1179
+ prop:Sequencer <code/sequencer/Illumina_GAIIx> ;
1180
+ prop:Hugo_Symbol <http://identifiers.org/hgnc.symbol/A2BP1> ;
1181
+ prop:Entrez_Gene_Id <http://identifiers.org/ncbigene/54715> ;
1182
+ prop:Center "genome.wustl.edu" ;
1183
+ prop:NCBI_Build 37 ;
1184
+ prop:Chromosome 16 ;
1185
+ prop:Start_Position 7383011 ;
1186
+ prop:End_Position 7383011 ;
1187
+ prop:Strand "+" ;
1188
+ prop:Reference_Allele "G" ;
1189
+ prop:Tumor_Seq_Allele1 "G" ;
1190
+ prop:Tumor_Seq_Allele2 "A" ;
1191
+ prop:dbSNP_RS "novel" ;
1192
+ prop:Tumor_Sample_Barcode "TCGA-AR-A1AJ-01A-21D-A12Q-09" ;
1193
+ prop:Matched_Norm_Sample_Barcode "TCGA-AR-A1AJ-10A-01D-A12Q-09" ;
1194
+ prop:Match_Norm_Seq_Allele1 "G" ;
1195
+ prop:Match_Norm_Seq_Allele2 "G" ;
1196
+ prop:Tumor_Validation_Allele1 "G" ;
1197
+ prop:Tumor_Validation_Allele2 "A" ;
1198
+ prop:Match_Norm_Validation_Allele1 "G" ;
1199
+ prop:Match_Norm_Validation_Allele2 "G" ;
1200
+ prop:Sequencing_Phase "Phase_IV" ;
1201
+ prop:Validation_Method "Illumina_WXS_gDNA" ;
1202
+ prop:Score 1 ;
1203
+ prop:BAM_File "dbGAP" ;
1204
+ prop:Tumor_Sample_UUID "4e1f9084-4729-4b3f-b036-6226d64fd25b" ;
1205
+ prop:Matched_Norm_Sample_UUID "63ee3781-4578-4d19-88e4-c8785fc7987e" ;
1206
+ prop:patient_id "AR-A1AJ" ;
1207
+ prop:sample_id "01A-21D-A12Q-09" ;
1208
+ .
1209
+
1210
+ ns:obs9 a qb:Observation ;
1211
+ qb:dataSet ns:dataset-MAF_ah1iit ;
1212
+ prop:Variant_Classification <code/variant_classification/Nonsense_Mutation> ;
1213
+ prop:Variant_Type <code/variant_type/SNP> ;
1214
+ prop:dbSNP_Val_Status <code/dbsnp_val_status/> ;
1215
+ prop:Verification_Status <code/verification_status/Unknown> ;
1216
+ prop:Validation_Status <code/validation_status/Valid> ;
1217
+ prop:Mutation_Status <code/mutation_status/Somatic> ;
1218
+ prop:Sequence_Source <code/sequence_source/WXS> ;
1219
+ prop:Sequencer <code/sequencer/Illumina_GAIIx> ;
1220
+ prop:Hugo_Symbol <http://identifiers.org/hgnc.symbol/A2M> ;
1221
+ prop:Entrez_Gene_Id <http://identifiers.org/ncbigene/2> ;
1222
+ prop:Center "genome.wustl.edu" ;
1223
+ prop:NCBI_Build 37 ;
1224
+ prop:Chromosome 12 ;
1225
+ prop:Start_Position 9251298 ;
1226
+ prop:End_Position 9251298 ;
1227
+ prop:Strand "+" ;
1228
+ prop:Reference_Allele "G" ;
1229
+ prop:Tumor_Seq_Allele1 "G" ;
1230
+ prop:Tumor_Seq_Allele2 "A" ;
1231
+ prop:dbSNP_RS "novel" ;
1232
+ prop:Tumor_Sample_Barcode "TCGA-A8-A08G-01A-11W-A019-09" ;
1233
+ prop:Matched_Norm_Sample_Barcode "TCGA-A8-A08G-10A-01W-A021-09" ;
1234
+ prop:Match_Norm_Seq_Allele1 "G" ;
1235
+ prop:Match_Norm_Seq_Allele2 "G" ;
1236
+ prop:Tumor_Validation_Allele1 "G" ;
1237
+ prop:Tumor_Validation_Allele2 "A" ;
1238
+ prop:Match_Norm_Validation_Allele1 "G" ;
1239
+ prop:Match_Norm_Validation_Allele2 "G" ;
1240
+ prop:Sequencing_Phase "Phase_IV" ;
1241
+ prop:Validation_Method "Illumina_WXS_gDNA" ;
1242
+ prop:Score 1 ;
1243
+ prop:BAM_File "dbGAP" ;
1244
+ prop:Tumor_Sample_UUID "8da61928-e935-4a33-8e46-840e637163d7" ;
1245
+ prop:Matched_Norm_Sample_UUID "74a3a4af-c93a-4fcd-af11-1f5eeb847c3c" ;
1246
+ prop:patient_id "A8-A08G" ;
1247
+ prop:sample_id "01A-11W-A019-09" ;
1248
+ .
1249
+