ms-sequest 0.0.4 → 0.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/History +4 -0
- data/lib/ms/sequest.rb +1 -1
- data/lib/ms/sequest/srf.rb +18 -14
- data/lib/ms/sequest/srf/search.rb +2 -0
- data/lib/ms/sequest/srf/sqt.rb +1 -3
- metadata +2 -2
data/History
CHANGED
data/lib/ms/sequest.rb
CHANGED
data/lib/ms/sequest/srf.rb
CHANGED
@@ -148,19 +148,22 @@ class Ms::Sequest::Srf
|
|
148
148
|
def from_file(filename, opts)
|
149
149
|
opts = { :filter_by_precursor_mass_tolerance => true, :link_protein_hits => true}.merge(opts)
|
150
150
|
params = Ms::Sequest::Srf.get_sequest_params(filename)
|
151
|
-
|
151
|
+
dup_references = 0
|
152
152
|
if params
|
153
|
-
|
154
|
-
if
|
153
|
+
dup_references = params.print_duplicate_references.to_i
|
154
|
+
if dup_references == 0
|
155
155
|
warn <<END
|
156
|
-
|
157
|
-
|
158
|
-
print_duplicate_references
|
159
|
-
|
160
|
-
|
156
|
+
*****************************************************************************
|
157
|
+
WARNING: This srf file lists only 1 protein per peptide! (based on the
|
158
|
+
print_duplicate_references parameter in the sequest.params file used in its
|
159
|
+
creation) So, downstream output will likewise only contain a single protein
|
160
|
+
for each peptide hit. In many instances this is OK since downstream programs
|
161
|
+
will recalculate protein-to-peptide linkages from the database file anyway.
|
162
|
+
For complete protein lists per peptide hit, .srf files must be created with
|
163
|
+
print_duplicate_references > 0. HINT: to capture all duplicate references,
|
164
|
+
set the sequest parameter 'print_duplicate_references' to 100 or greater.
|
165
|
+
*****************************************************************************
|
161
166
|
END
|
162
|
-
else
|
163
|
-
dups_gt_0 = true
|
164
167
|
end
|
165
168
|
else
|
166
169
|
end
|
@@ -179,7 +182,7 @@ END
|
|
179
182
|
end
|
180
183
|
@dta_files, measured_mhs = read_dta_files(fh,@header.num_dta_files, unpack_35)
|
181
184
|
|
182
|
-
@out_files = read_out_files(fh,@header.num_dta_files, measured_mhs, unpack_35)
|
185
|
+
@out_files = read_out_files(fh,@header.num_dta_files, measured_mhs, unpack_35, dup_references)
|
183
186
|
if fh.eof?
|
184
187
|
#warn "FILE: '#{filename}' appears to be an abortive run (no params in srf file)\nstill continuing..."
|
185
188
|
@params = nil
|
@@ -257,10 +260,10 @@ END
|
|
257
260
|
|
258
261
|
# filehandle (fh) must be at the start of the outfiles. 'read_dta_files'
|
259
262
|
# will put the fh there.
|
260
|
-
def read_out_files(fh,number_files, measured_mhs, unpack_35)
|
263
|
+
def read_out_files(fh,number_files, measured_mhs, unpack_35, dup_references)
|
261
264
|
out_files = Array.new(number_files)
|
262
265
|
header.num_dta_files.times do |i|
|
263
|
-
out_files[i] = Ms::Sequest::Srf::Out.new.from_io(fh, unpack_35)
|
266
|
+
out_files[i] = Ms::Sequest::Srf::Out.new.from_io(fh, unpack_35, dup_references)
|
264
267
|
end
|
265
268
|
out_files
|
266
269
|
end
|
@@ -467,7 +470,7 @@ class Ms::Sequest::Srf::Out
|
|
467
470
|
"<Ms::Sequest::Srf::Out first_scan=#{first_scan}, last_scan=#{last_scan}, charge=#{charge}, num_hits=#{num_hits}, computer=#{computer}, date_time=#{date_time}#{hits_s}>"
|
468
471
|
end
|
469
472
|
|
470
|
-
def from_io(fh, unpack_35)
|
473
|
+
def from_io(fh, unpack_35, dup_references)
|
471
474
|
## EMPTY out file is 96 bytes
|
472
475
|
## each hit is 320 bytes
|
473
476
|
## num_hits and charge:
|
@@ -484,6 +487,7 @@ class Ms::Sequest::Srf::Out
|
|
484
487
|
ar[i] = Ms::Sequest::Srf::Out::Pep.new.from_io(fh, unpack_35)
|
485
488
|
num_extra_references += ar[i].num_other_loci
|
486
489
|
end
|
490
|
+
num_extra_references = dup_references if num_extra_references > dup_references
|
487
491
|
Ms::Sequest::Srf::Out::Pep.read_extra_references(fh, num_extra_references, ar)
|
488
492
|
## The xcorrs are already ordered by best to worst hit
|
489
493
|
## ADJUST the deltacn's to be meaningful for the top hit:
|
data/lib/ms/sequest/srf/sqt.rb
CHANGED
@@ -1,5 +1,4 @@
|
|
1
1
|
require 'tap/task'
|
2
|
-
require 'configurable'
|
3
2
|
require 'ms/sequest'
|
4
3
|
require 'ms/sequest/srf'
|
5
4
|
require 'ms/sequest/sqt'
|
@@ -59,8 +58,7 @@ module Ms
|
|
59
58
|
'Comment' => ['Created from Bioworks .srf file']
|
60
59
|
}
|
61
60
|
|
62
|
-
|
63
|
-
db_filename = header.db_filename
|
61
|
+
db_filename = header.db_filename.sub(/\.hdr$/, '') # remove the .hdr postfix
|
64
62
|
db_filename_in_sqt = db_filename
|
65
63
|
if opt[:new_db_path]
|
66
64
|
db_filename = File.join(opt[:new_db_path], File.basename(db_filename.gsub('\\', '/')))
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: ms-sequest
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.0.
|
4
|
+
version: 0.0.5
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- John Prince
|
@@ -9,7 +9,7 @@ autorequire:
|
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
11
|
|
12
|
-
date: 2009-06-
|
12
|
+
date: 2009-06-22 00:00:00 -06:00
|
13
13
|
default_executable:
|
14
14
|
dependencies:
|
15
15
|
- !ruby/object:Gem::Dependency
|