mspire 0.2.4 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (233) hide show
  1. data/INSTALL +1 -0
  2. data/README +25 -0
  3. data/Rakefile +129 -40
  4. data/bin/{find_aa_freq.rb → aafreqs.rb} +2 -2
  5. data/bin/bioworks_to_pepxml.rb +1 -0
  6. data/bin/fasta_shaker.rb +1 -96
  7. data/bin/filter_and_validate.rb +5 -0
  8. data/bin/{mzxml_to_lmat.rb → ms_to_lmat.rb} +8 -7
  9. data/bin/prob_validate.rb +6 -0
  10. data/bin/raw_to_mzXML.rb +2 -2
  11. data/bin/srf_group.rb +1 -0
  12. data/bin/srf_to_sqt.rb +40 -0
  13. data/changelog.txt +68 -0
  14. data/lib/align/chams.rb +6 -6
  15. data/lib/align.rb +4 -3
  16. data/lib/bsearch.rb +120 -0
  17. data/lib/fasta.rb +318 -86
  18. data/lib/group_by.rb +10 -0
  19. data/lib/index_by.rb +11 -0
  20. data/lib/merge_deep.rb +21 -0
  21. data/lib/{spec → ms/converter}/mzxml.rb +77 -109
  22. data/lib/ms/gradient_program.rb +171 -0
  23. data/lib/ms/msrun.rb +209 -0
  24. data/lib/{spec/msrun.rb → ms/msrun_index.rb} +7 -40
  25. data/lib/ms/parser/mzdata/axml.rb +12 -0
  26. data/lib/ms/parser/mzdata/dom.rb +160 -0
  27. data/lib/ms/parser/mzdata/libxml.rb +7 -0
  28. data/lib/ms/parser/mzdata.rb +25 -0
  29. data/lib/ms/parser/mzxml/axml.rb +11 -0
  30. data/lib/ms/parser/mzxml/dom.rb +159 -0
  31. data/lib/ms/parser/mzxml/hpricot.rb +253 -0
  32. data/lib/ms/parser/mzxml/libxml.rb +15 -0
  33. data/lib/ms/parser/mzxml/regexp.rb +122 -0
  34. data/lib/ms/parser/mzxml/rexml.rb +72 -0
  35. data/lib/ms/parser/mzxml/xmlparser.rb +248 -0
  36. data/lib/ms/parser/mzxml.rb +175 -0
  37. data/lib/ms/parser.rb +108 -0
  38. data/lib/ms/precursor.rb +10 -0
  39. data/lib/ms/scan.rb +81 -0
  40. data/lib/ms/spectrum.rb +193 -0
  41. data/lib/ms.rb +10 -0
  42. data/lib/mspire.rb +4 -0
  43. data/lib/roc.rb +61 -1
  44. data/lib/sample_enzyme.rb +31 -8
  45. data/lib/scan_i.rb +21 -0
  46. data/lib/spec_id/aa_freqs.rb +7 -3
  47. data/lib/spec_id/bioworks.rb +20 -14
  48. data/lib/spec_id/digestor.rb +139 -0
  49. data/lib/spec_id/mass.rb +116 -0
  50. data/lib/spec_id/parser/proph.rb +236 -0
  51. data/lib/spec_id/precision/filter/cmdline.rb +209 -0
  52. data/lib/spec_id/precision/filter/interactive.rb +134 -0
  53. data/lib/spec_id/precision/filter/output.rb +147 -0
  54. data/lib/spec_id/precision/filter.rb +623 -0
  55. data/lib/spec_id/precision/output.rb +60 -0
  56. data/lib/spec_id/precision/prob/cmdline.rb +139 -0
  57. data/lib/spec_id/precision/prob/output.rb +88 -0
  58. data/lib/spec_id/precision/prob.rb +171 -0
  59. data/lib/spec_id/proph/pep_summary.rb +92 -0
  60. data/lib/spec_id/proph/prot_summary.rb +484 -0
  61. data/lib/spec_id/proph.rb +2 -466
  62. data/lib/spec_id/protein_summary.rb +2 -2
  63. data/lib/spec_id/sequest/params.rb +316 -0
  64. data/lib/spec_id/sequest/pepxml.rb +1513 -0
  65. data/lib/spec_id/sequest.rb +2 -1672
  66. data/lib/spec_id/srf.rb +445 -177
  67. data/lib/spec_id.rb +183 -95
  68. data/lib/spec_id_xml.rb +8 -10
  69. data/lib/transmem/phobius.rb +147 -0
  70. data/lib/transmem/toppred.rb +368 -0
  71. data/lib/transmem.rb +157 -0
  72. data/lib/validator/aa.rb +135 -0
  73. data/lib/validator/background.rb +73 -0
  74. data/lib/validator/bias.rb +95 -0
  75. data/lib/validator/cmdline.rb +260 -0
  76. data/lib/validator/decoy.rb +94 -0
  77. data/lib/validator/digestion_based.rb +69 -0
  78. data/lib/validator/probability.rb +48 -0
  79. data/lib/validator/prot_from_pep.rb +234 -0
  80. data/lib/validator/transmem.rb +272 -0
  81. data/lib/validator/true_pos.rb +46 -0
  82. data/lib/validator.rb +214 -0
  83. data/lib/xml.rb +38 -0
  84. data/lib/xml_style_parser.rb +105 -0
  85. data/lib/xmlparser_wrapper.rb +19 -0
  86. data/script/compile_and_plot_smriti_final.rb +97 -0
  87. data/script/extract_gradient_programs.rb +56 -0
  88. data/script/get_apex_values_rexml.rb +44 -0
  89. data/script/mzXML2timeIndex.rb +1 -1
  90. data/script/smriti_final_analysis.rb +103 -0
  91. data/script/toppred_to_yaml.rb +47 -0
  92. data/script/tpp_installer.rb +1 -1
  93. data/{test/tc_align.rb → specs/align_spec.rb} +21 -27
  94. data/{test/tc_bioworks_to_pepxml.rb → specs/bin/bioworks_to_pepxml_spec.rb} +25 -41
  95. data/specs/bin/fasta_shaker_spec.rb +259 -0
  96. data/specs/bin/filter_and_validate__multiple_vals_helper.yaml +202 -0
  97. data/specs/bin/filter_and_validate_spec.rb +124 -0
  98. data/specs/bin/ms_to_lmat_spec.rb +34 -0
  99. data/specs/bin/prob_validate_spec.rb +62 -0
  100. data/specs/bin/protein_summary_spec.rb +10 -0
  101. data/{test/tc_fasta.rb → specs/fasta_spec.rb} +354 -310
  102. data/specs/gi_spec.rb +22 -0
  103. data/specs/load_bin_path.rb +7 -0
  104. data/specs/merge_deep_spec.rb +13 -0
  105. data/specs/ms/gradient_program_spec.rb +77 -0
  106. data/specs/ms/msrun_spec.rb +455 -0
  107. data/specs/ms/parser_spec.rb +92 -0
  108. data/specs/ms/spectrum_spec.rb +89 -0
  109. data/specs/roc_spec.rb +251 -0
  110. data/specs/rspec_autotest.rb +149 -0
  111. data/specs/sample_enzyme_spec.rb +41 -0
  112. data/specs/spec_helper.rb +133 -0
  113. data/specs/spec_id/aa_freqs_spec.rb +52 -0
  114. data/{test/tc_bioworks.rb → specs/spec_id/bioworks_spec.rb} +56 -71
  115. data/specs/spec_id/digestor_spec.rb +75 -0
  116. data/specs/spec_id/precision/filter/cmdline_spec.rb +20 -0
  117. data/specs/spec_id/precision/filter/output_spec.rb +31 -0
  118. data/specs/spec_id/precision/filter_spec.rb +243 -0
  119. data/specs/spec_id/precision/prob_spec.rb +111 -0
  120. data/specs/spec_id/precision/prob_spec_helper.rb +0 -0
  121. data/specs/spec_id/proph/pep_summary_spec.rb +143 -0
  122. data/{test/tc_proph.rb → specs/spec_id/proph/prot_summary_spec.rb} +52 -32
  123. data/{test/tc_protein_summary.rb → specs/spec_id/protein_summary_spec.rb} +85 -0
  124. data/specs/spec_id/sequest/params_spec.rb +68 -0
  125. data/specs/spec_id/sequest/pepxml_spec.rb +452 -0
  126. data/specs/spec_id/sqt_spec.rb +138 -0
  127. data/specs/spec_id/srf_spec.rb +209 -0
  128. data/specs/spec_id/srf_spec_helper.rb +302 -0
  129. data/specs/spec_id_helper.rb +33 -0
  130. data/specs/spec_id_spec.rb +361 -0
  131. data/specs/spec_id_xml_spec.rb +33 -0
  132. data/specs/transmem/phobius_spec.rb +423 -0
  133. data/specs/transmem/toppred_spec.rb +297 -0
  134. data/specs/transmem_spec.rb +60 -0
  135. data/specs/transmem_spec_shared.rb +64 -0
  136. data/specs/validator/aa_spec.rb +107 -0
  137. data/specs/validator/background_spec.rb +51 -0
  138. data/specs/validator/bias_spec.rb +146 -0
  139. data/specs/validator/decoy_spec.rb +51 -0
  140. data/specs/validator/fasta_helper.rb +26 -0
  141. data/specs/validator/prot_from_pep_spec.rb +141 -0
  142. data/specs/validator/transmem_spec.rb +145 -0
  143. data/specs/validator/true_pos_spec.rb +58 -0
  144. data/specs/validator_helper.rb +33 -0
  145. data/specs/xml_spec.rb +12 -0
  146. data/test_files/000_pepxml18_small.xml +206 -0
  147. data/test_files/020a.mzXML.timeIndex +4710 -0
  148. data/test_files/4-03-03_mzXML/000.mzXML.timeIndex +3973 -0
  149. data/test_files/4-03-03_mzXML/020.mzXML.timeIndex +3872 -0
  150. data/test_files/4-03-03_small-prot.xml +321 -0
  151. data/test_files/4-03-03_small.xml +3876 -0
  152. data/test_files/7MIX_STD_110802_1.sequest_params_fragment.srf +0 -0
  153. data/test_files/bioworks-3.3_10prots.xml +5999 -0
  154. data/test_files/bioworks31.params +77 -0
  155. data/test_files/bioworks32.params +62 -0
  156. data/test_files/bioworks33.params +63 -0
  157. data/test_files/bioworks_single_run_small.xml +7237 -0
  158. data/test_files/bioworks_small.fasta +212 -0
  159. data/test_files/bioworks_small.params +63 -0
  160. data/test_files/bioworks_small.phobius +109 -0
  161. data/test_files/bioworks_small.toppred.out +2847 -0
  162. data/test_files/bioworks_small.xml +5610 -0
  163. data/test_files/bioworks_with_INV_small.xml +3753 -0
  164. data/test_files/bioworks_with_SHUFF_small.xml +2503 -0
  165. data/test_files/corrupted_900.srf +0 -0
  166. data/test_files/head_of_7MIX.srf +0 -0
  167. data/test_files/interact-opd1_mods_small-prot.xml +304 -0
  168. data/test_files/messups.fasta +297 -0
  169. data/test_files/opd1/000.my_answer.100lines.xml +101 -0
  170. data/test_files/opd1/000.tpp_1.2.3.first10.xml +115 -0
  171. data/test_files/opd1/000.tpp_2.9.2.first10.xml +126 -0
  172. data/test_files/opd1/000.v2.1.mzXML.timeIndex +3748 -0
  173. data/test_files/opd1/000_020-prot.png +0 -0
  174. data/test_files/opd1/000_020_3prots-prot.mod_initprob.xml +62 -0
  175. data/test_files/opd1/000_020_3prots-prot.xml +62 -0
  176. data/test_files/opd1/opd1_cat_inv_small-prot.xml +139 -0
  177. data/test_files/opd1/sequest.3.1.params +77 -0
  178. data/test_files/opd1/sequest.3.2.params +62 -0
  179. data/test_files/opd1/twenty_scans.mzXML +418 -0
  180. data/test_files/opd1/twenty_scans.v2.1.mzXML +382 -0
  181. data/test_files/opd1/twenty_scans_answ.lmat +0 -0
  182. data/test_files/opd1/twenty_scans_answ.lmata +9 -0
  183. data/test_files/opd1_020_beginning.RAW +0 -0
  184. data/test_files/opd1_2runs_2mods/interact-opd1_mods__small.xml +753 -0
  185. data/test_files/orbitrap_mzData/000_cut.xml +1920 -0
  186. data/test_files/pepproph_small.xml +4691 -0
  187. data/test_files/phobius.small.noheader.txt +50 -0
  188. data/test_files/phobius.small.small.txt +53 -0
  189. data/test_files/s01_anC1_ld020mM.key.txt +25 -0
  190. data/test_files/s01_anC1_ld020mM.meth +0 -0
  191. data/test_files/small.fasta +297 -0
  192. data/test_files/smallraw.RAW +0 -0
  193. data/test_files/tf_bioworks2excel.bioXML +14340 -0
  194. data/test_files/tf_bioworks2excel.txt.actual +1035 -0
  195. data/test_files/toppred.small.out +416 -0
  196. data/test_files/toppred.xml.out +318 -0
  197. data/test_files/validator_hits_separate/bias_bioworks_small_HS.fasta +7 -0
  198. data/test_files/validator_hits_separate/bioworks_small_HS.xml +5651 -0
  199. data/test_files/yeast_gly_small-prot.xml +265 -0
  200. data/test_files/yeast_gly_small.1.0_1.0_1.0.parentTimes +6 -0
  201. data/test_files/yeast_gly_small.xml +3807 -0
  202. data/test_files/yeast_gly_small2.parentTimes +6 -0
  203. metadata +273 -57
  204. data/bin/filter.rb +0 -6
  205. data/bin/precision.rb +0 -5
  206. data/lib/spec/mzdata/parser.rb +0 -108
  207. data/lib/spec/mzdata.rb +0 -48
  208. data/lib/spec/mzxml/parser.rb +0 -449
  209. data/lib/spec/scan.rb +0 -55
  210. data/lib/spec_id/filter.rb +0 -797
  211. data/lib/spec_id/precision.rb +0 -421
  212. data/lib/toppred.rb +0 -18
  213. data/script/filter-peps.rb +0 -164
  214. data/test/tc_aa_freqs.rb +0 -59
  215. data/test/tc_fasta_shaker.rb +0 -149
  216. data/test/tc_filter.rb +0 -203
  217. data/test/tc_filter_peps.rb +0 -46
  218. data/test/tc_gi.rb +0 -17
  219. data/test/tc_id_class_anal.rb +0 -70
  220. data/test/tc_id_precision.rb +0 -89
  221. data/test/tc_msrun.rb +0 -88
  222. data/test/tc_mzxml.rb +0 -88
  223. data/test/tc_mzxml_to_lmat.rb +0 -36
  224. data/test/tc_peptide_parent_times.rb +0 -27
  225. data/test/tc_precision.rb +0 -60
  226. data/test/tc_roc.rb +0 -166
  227. data/test/tc_sample_enzyme.rb +0 -32
  228. data/test/tc_scan.rb +0 -26
  229. data/test/tc_sequest.rb +0 -336
  230. data/test/tc_spec.rb +0 -78
  231. data/test/tc_spec_id.rb +0 -201
  232. data/test/tc_spec_id_xml.rb +0 -36
  233. data/test/tc_srf.rb +0 -262
@@ -0,0 +1,6 @@
1
+ # PROTCUTOFF: 1.0 NSPPEPCUTOFF: 1.0 INITPEPCUTOFF: 1.0
2
+ # These are the times of the precursor scan!
3
+ # filename sequence charge time1 prec_mz prec_int time2 ...
4
+ 020a EVIDTILALVK 2 5575.870000 610.063965 4030201.000000 5537.900000 615.687988 9531986.000000
5
+ 020a TPANAAVPASTPLK 2 1037.230000 669.406616 6435475.000000 1030.090000 672.593262 5464264.000000
6
+ 020a YVRPPIIVGDLSR 3 2772.160000 498.767334 3464513.000000 2755.730000 493.924683 2817155.000000
metadata CHANGED
@@ -3,8 +3,8 @@ rubygems_version: 0.9.2
3
3
  specification_version: 1
4
4
  name: mspire
5
5
  version: !ruby/object:Gem::Version
6
- version: 0.2.4
7
- date: 2007-05-17 00:00:00 -05:00
6
+ version: 0.3.0
7
+ date: 2007-12-13 00:00:00 -06:00
8
8
  summary: Mass Spectrometry Proteomics Objects, Scripts, and Executables
9
9
  require_paths:
10
10
  - lib
@@ -29,43 +29,105 @@ post_install_message:
29
29
  authors:
30
30
  - John Prince
31
31
  files:
32
+ - INSTALL
33
+ - README
34
+ - Rakefile
35
+ - LICENSE
36
+ - changelog.txt
37
+ - release_notes.txt
32
38
  - lib/spec_id
33
39
  - lib/align
34
- - lib/spec
40
+ - lib/ms
35
41
  - lib/spec_id.rb
36
42
  - lib/fasta.rb
37
43
  - lib/align.rb
38
44
  - lib/sample_enzyme.rb
45
+ - lib/ms.rb
39
46
  - lib/gi.rb
40
47
  - lib/roc.rb
41
48
  - lib/spec_id_xml.rb
42
- - lib/toppred.rb
49
+ - lib/validator.rb
50
+ - lib/transmem
51
+ - lib/transmem.rb
52
+ - lib/xml_style_parser.rb
53
+ - lib/xmlparser_wrapper.rb
54
+ - lib/bsearch.rb
55
+ - lib/group_by.rb
56
+ - lib/xml.rb
57
+ - lib/merge_deep.rb
58
+ - lib/index_by.rb
59
+ - lib/validator
60
+ - lib/mspire.rb
61
+ - lib/scan_i.rb
43
62
  - lib/spec_id/sequest.rb
44
63
  - lib/spec_id/bioworks.rb
45
64
  - lib/spec_id/proph.rb
46
- - lib/spec_id/precision.rb
65
+ - lib/spec_id/parser
47
66
  - lib/spec_id/srf.rb
48
67
  - lib/spec_id/aa_freqs.rb
49
68
  - lib/spec_id/protein_summary.rb
50
- - lib/spec_id/filter.rb
69
+ - lib/spec_id/precision
70
+ - lib/spec_id/digestor.rb
71
+ - lib/spec_id/proph
72
+ - lib/spec_id/sequest
73
+ - lib/spec_id/mass.rb
74
+ - lib/spec_id/parser/proph.rb
75
+ - lib/spec_id/precision/prob.rb
76
+ - lib/spec_id/precision/filter
77
+ - lib/spec_id/precision/filter.rb
78
+ - lib/spec_id/precision/prob
79
+ - lib/spec_id/precision/output.rb
80
+ - lib/spec_id/precision/filter/interactive.rb
81
+ - lib/spec_id/precision/filter/output.rb
82
+ - lib/spec_id/precision/filter/cmdline.rb
83
+ - lib/spec_id/precision/prob/output.rb
84
+ - lib/spec_id/precision/prob/cmdline.rb
85
+ - lib/spec_id/proph/pep_summary.rb
86
+ - lib/spec_id/proph/prot_summary.rb
87
+ - lib/spec_id/sequest/params.rb
88
+ - lib/spec_id/sequest/pepxml.rb
51
89
  - lib/align/chams.rb
52
- - lib/spec/mzxml
53
- - lib/spec/mzdata
54
- - lib/spec/msrun.rb
55
- - lib/spec/scan.rb
56
- - lib/spec/mzxml.rb
57
- - lib/spec/mzdata.rb
58
- - lib/spec/mzxml/parser.rb
59
- - lib/spec/mzdata/parser.rb
60
- - INSTALL
61
- - README
62
- - Rakefile
63
- - LICENSE
64
- - changelog.txt
65
- - release_notes.txt
90
+ - lib/ms/converter
91
+ - lib/ms/parser
92
+ - lib/ms/spectrum.rb
93
+ - lib/ms/gradient_program.rb
94
+ - lib/ms/msrun.rb
95
+ - lib/ms/precursor.rb
96
+ - lib/ms/scan.rb
97
+ - lib/ms/msrun_index.rb
98
+ - lib/ms/parser.rb
99
+ - lib/ms/converter/mzxml.rb
100
+ - lib/ms/parser/mzdata
101
+ - lib/ms/parser/mzxml
102
+ - lib/ms/parser/mzdata.rb
103
+ - lib/ms/parser/mzxml.rb
104
+ - lib/ms/parser/mzdata/libxml.rb
105
+ - lib/ms/parser/mzdata/axml.rb
106
+ - lib/ms/parser/mzdata/dom.rb
107
+ - lib/ms/parser/mzxml/xmlparser.rb
108
+ - lib/ms/parser/mzxml/libxml.rb
109
+ - lib/ms/parser/mzxml/rexml.rb
110
+ - lib/ms/parser/mzxml/regexp.rb
111
+ - lib/ms/parser/mzxml/axml.rb
112
+ - lib/ms/parser/mzxml/hpricot.rb
113
+ - lib/ms/parser/mzxml/dom.rb
114
+ - lib/transmem/toppred.rb
115
+ - lib/transmem/phobius.rb
116
+ - lib/validator/prot_from_pep.rb
117
+ - lib/validator/true_pos.rb
118
+ - lib/validator/aa.rb
119
+ - lib/validator/decoy.rb
120
+ - lib/validator/transmem.rb
121
+ - lib/validator/cmdline.rb
122
+ - lib/validator/bias.rb
123
+ - lib/validator/background.rb
124
+ - lib/validator/digestion_based.rb
125
+ - lib/validator/probability.rb
66
126
  - bin/bioworks_to_pepxml_gui.rb
67
127
  - bin/gi2annot.rb
68
128
  - bin/protein_summary.rb
129
+ - bin/ms_to_lmat.rb
130
+ - bin/aafreqs.rb
69
131
  - bin/bioworks2excel.rb
70
132
  - bin/pepproph_filter.rb
71
133
  - bin/fasta_shaker.rb
@@ -73,11 +135,10 @@ files:
73
135
  - bin/protxml2prots_peps.rb
74
136
  - bin/id_precision.rb
75
137
  - bin/id_class_anal.rb
76
- - bin/mzxml_to_lmat.rb
77
- - bin/find_aa_freq.rb
78
- - bin/filter.rb
138
+ - bin/prob_validate.rb
139
+ - bin/srf_to_sqt.rb
140
+ - bin/filter_and_validate.rb
79
141
  - bin/srf_group.rb
80
- - bin/precision.rb
81
142
  - bin/raw_to_mzXML.rb
82
143
  - script/create_little_pepxml.rb
83
144
  - script/mzXML2timeIndex.rb
@@ -86,39 +147,184 @@ files:
86
147
  - script/histogram_probs.rb
87
148
  - script/prep_dir.rb
88
149
  - script/top_hit_per_scan.rb
89
- - script/filter-peps.rb
90
150
  - script/genuine_tps_and_probs.rb
151
+ - script/compile_and_plot_smriti_final.rb
91
152
  - script/simple_protein_digestion.rb
92
153
  - script/estimate_fpr_by_cysteine.rb
93
154
  - script/find_cysteine_background.rb
94
155
  - script/degenerate_peptides.rb
156
+ - script/smriti_final_analysis.rb
157
+ - script/toppred_to_yaml.rb
158
+ - script/get_apex_values_rexml.rb
159
+ - script/extract_gradient_programs.rb
160
+ - specs/transmem_spec.rb
161
+ - specs/roc_spec.rb
162
+ - specs/ms
163
+ - specs/load_bin_path.rb
164
+ - specs/validator
165
+ - specs/spec_helper.rb
166
+ - specs/transmem
167
+ - specs/spec_id
168
+ - specs/spec_id_helper.rb
169
+ - specs/fasta_spec.rb
170
+ - specs/gi_spec.rb
171
+ - specs/bin
172
+ - specs/validator_helper.rb
173
+ - specs/merge_deep_spec.rb
174
+ - specs/xml_spec.rb
175
+ - specs/spec_id_spec.rb
176
+ - specs/align_spec.rb
177
+ - specs/rspec_autotest.rb
178
+ - specs/sample_enzyme_spec.rb
179
+ - specs/spec_id_xml_spec.rb
180
+ - specs/transmem_spec_shared.rb
181
+ - specs/ms/gradient_program_spec.rb
182
+ - specs/ms/msrun_spec.rb
183
+ - specs/ms/parser_spec.rb
184
+ - specs/ms/spectrum_spec.rb
185
+ - specs/validator/background_spec.rb
186
+ - specs/validator/decoy_spec.rb
187
+ - specs/validator/transmem_spec.rb
188
+ - specs/validator/true_pos_spec.rb
189
+ - specs/validator/prot_from_pep_spec.rb
190
+ - specs/validator/aa_spec.rb
191
+ - specs/validator/fasta_helper.rb
192
+ - specs/validator/bias_spec.rb
193
+ - specs/transmem/toppred_spec.rb
194
+ - specs/transmem/phobius_spec.rb
195
+ - specs/spec_id/bioworks_spec.rb
196
+ - specs/spec_id/aa_freqs_spec.rb
197
+ - specs/spec_id/srf_spec.rb
198
+ - specs/spec_id/precision
199
+ - specs/spec_id/srf_spec_helper.rb
200
+ - specs/spec_id/sequest
201
+ - specs/spec_id/digestor_spec.rb
202
+ - specs/spec_id/protein_summary_spec.rb
203
+ - specs/spec_id/proph
204
+ - specs/spec_id/sqt_spec.rb
205
+ - specs/spec_id/precision/filter
206
+ - specs/spec_id/precision/prob_spec.rb
207
+ - specs/spec_id/precision/filter_spec.rb
208
+ - specs/spec_id/precision/prob_spec_helper.rb
209
+ - specs/spec_id/precision/filter/cmdline_spec.rb
210
+ - specs/spec_id/precision/filter/output_spec.rb
211
+ - specs/spec_id/sequest/params_spec.rb
212
+ - specs/spec_id/sequest/pepxml_spec.rb
213
+ - specs/spec_id/proph/prot_summary_spec.rb
214
+ - specs/spec_id/proph/pep_summary_spec.rb
215
+ - specs/bin/filter_and_validate_spec.rb
216
+ - specs/bin/fasta_shaker_spec.rb
217
+ - specs/bin/bioworks_to_pepxml_spec.rb
218
+ - specs/bin/protein_summary_spec.rb
219
+ - specs/bin/ms_to_lmat_spec.rb
220
+ - specs/bin/filter_and_validate__multiple_vals_helper.yaml
221
+ - specs/bin/prob_validate_spec.rb
222
+ - test_files/4-03-03_mzXML
223
+ - test_files/opd1
224
+ - test_files/orbitrap_mzData
225
+ - test_files/messups.fasta
226
+ - test_files/small.fasta
227
+ - test_files/toppred.xml.out
228
+ - test_files/smallraw.RAW
229
+ - test_files/bioworks_single_run_small.xml
230
+ - test_files/tf_bioworks2excel.txt.actual
231
+ - test_files/pepproph_small.xml
232
+ - test_files/000_pepxml18_small.xml
233
+ - test_files/tf_bioworks2excel.bioXML
234
+ - test_files/bioworks31.params
235
+ - test_files/bioworks_small.xml
236
+ - test_files/bioworks32.params
237
+ - test_files/yeast_gly_small.xml
238
+ - test_files/4-03-03_small.xml
239
+ - test_files/bioworks_with_INV_small.xml
240
+ - test_files/020a.mzXML.timeIndex
241
+ - test_files/yeast_gly_small2.parentTimes
242
+ - test_files/s01_anC1_ld020mM.meth
243
+ - test_files/yeast_gly_small-prot.xml
244
+ - test_files/bioworks-3.3_10prots.xml
245
+ - test_files/4-03-03_small-prot.xml
246
+ - test_files/bioworks33.params
247
+ - test_files/head_of_7MIX.srf
248
+ - test_files/yeast_gly_small.1.0_1.0_1.0.parentTimes
249
+ - test_files/bioworks_with_SHUFF_small.xml
250
+ - test_files/toppred.small.out
251
+ - test_files/phobius.small.small.txt
252
+ - test_files/s01_anC1_ld020mM.key.txt
253
+ - test_files/7MIX_STD_110802_1.sequest_params_fragment.srf
254
+ - test_files/phobius.small.noheader.txt
255
+ - test_files/interact-opd1_mods_small-prot.xml
256
+ - test_files/corrupted_900.srf
257
+ - test_files/validator_hits_separate
258
+ - test_files/bioworks_small.phobius
259
+ - test_files/bioworks_small.params
260
+ - test_files/bioworks_small.toppred.out
261
+ - test_files/bioworks_small.fasta
262
+ - test_files/opd1_020_beginning.RAW
263
+ - test_files/opd1_2runs_2mods
264
+ - test_files/4-03-03_mzXML/000.mzXML.timeIndex
265
+ - test_files/4-03-03_mzXML/020.mzXML.timeIndex
266
+ - test_files/opd1/opd1_cat_inv_small-prot.xml
267
+ - test_files/opd1/000.v2.1.mzXML.timeIndex
268
+ - test_files/opd1/000.tpp_2.9.2.first10.xml
269
+ - test_files/opd1/000_020-prot.png
270
+ - test_files/opd1/twenty_scans.mzXML
271
+ - test_files/opd1/000.my_answer.100lines.xml
272
+ - test_files/opd1/twenty_scans_answ.lmat
273
+ - test_files/opd1/twenty_scans_answ.lmata
274
+ - test_files/opd1/000.tpp_1.2.3.first10.xml
275
+ - test_files/opd1/sequest.3.1.params
276
+ - test_files/opd1/000_020_3prots-prot.xml
277
+ - test_files/opd1/twenty_scans.v2.1.mzXML
278
+ - test_files/opd1/sequest.3.2.params
279
+ - test_files/opd1/000_020_3prots-prot.mod_initprob.xml
280
+ - test_files/orbitrap_mzData/000_cut.xml
281
+ - test_files/validator_hits_separate/bioworks_small_HS.xml
282
+ - test_files/validator_hits_separate/bias_bioworks_small_HS.fasta
283
+ - test_files/opd1_2runs_2mods/interact-opd1_mods__small.xml
95
284
  test_files:
96
- - test/tc_aa_freqs.rb
97
- - test/tc_proph.rb
98
- - test/tc_gi.rb
99
- - test/tc_align.rb
100
- - test/tc_sequest.rb
101
- - test/tc_spec.rb
102
- - test/tc_bioworks.rb
103
- - test/tc_protein_summary.rb
104
- - test/tc_fasta.rb
105
- - test/tc_msrun.rb
106
- - test/tc_peptide_parent_times.rb
107
- - test/tc_spec_id.rb
108
- - test/tc_mzxml.rb
109
- - test/tc_srf.rb
110
- - test/tc_id_precision.rb
111
- - test/tc_id_class_anal.rb
112
- - test/tc_filter_peps.rb
113
- - test/tc_precision.rb
114
- - test/tc_filter.rb
115
- - test/tc_roc.rb
116
- - test/tc_scan.rb
117
- - test/tc_bioworks_to_pepxml.rb
118
- - test/tc_mzxml_to_lmat.rb
119
- - test/tc_fasta_shaker.rb
120
- - test/tc_sample_enzyme.rb
121
- - test/tc_spec_id_xml.rb
285
+ - specs/transmem_spec.rb
286
+ - specs/roc_spec.rb
287
+ - specs/fasta_spec.rb
288
+ - specs/gi_spec.rb
289
+ - specs/merge_deep_spec.rb
290
+ - specs/xml_spec.rb
291
+ - specs/spec_id_spec.rb
292
+ - specs/align_spec.rb
293
+ - specs/sample_enzyme_spec.rb
294
+ - specs/spec_id_xml_spec.rb
295
+ - specs/ms/gradient_program_spec.rb
296
+ - specs/ms/msrun_spec.rb
297
+ - specs/ms/parser_spec.rb
298
+ - specs/ms/spectrum_spec.rb
299
+ - specs/validator/background_spec.rb
300
+ - specs/validator/decoy_spec.rb
301
+ - specs/validator/transmem_spec.rb
302
+ - specs/validator/true_pos_spec.rb
303
+ - specs/validator/prot_from_pep_spec.rb
304
+ - specs/validator/aa_spec.rb
305
+ - specs/validator/bias_spec.rb
306
+ - specs/transmem/toppred_spec.rb
307
+ - specs/transmem/phobius_spec.rb
308
+ - specs/spec_id/bioworks_spec.rb
309
+ - specs/spec_id/aa_freqs_spec.rb
310
+ - specs/spec_id/srf_spec.rb
311
+ - specs/spec_id/digestor_spec.rb
312
+ - specs/spec_id/protein_summary_spec.rb
313
+ - specs/spec_id/sqt_spec.rb
314
+ - specs/spec_id/precision/prob_spec.rb
315
+ - specs/spec_id/precision/filter_spec.rb
316
+ - specs/spec_id/precision/filter/cmdline_spec.rb
317
+ - specs/spec_id/precision/filter/output_spec.rb
318
+ - specs/spec_id/sequest/params_spec.rb
319
+ - specs/spec_id/sequest/pepxml_spec.rb
320
+ - specs/spec_id/proph/prot_summary_spec.rb
321
+ - specs/spec_id/proph/pep_summary_spec.rb
322
+ - specs/bin/filter_and_validate_spec.rb
323
+ - specs/bin/fasta_shaker_spec.rb
324
+ - specs/bin/bioworks_to_pepxml_spec.rb
325
+ - specs/bin/protein_summary_spec.rb
326
+ - specs/bin/ms_to_lmat_spec.rb
327
+ - specs/bin/prob_validate_spec.rb
122
328
  rdoc_options:
123
329
  - --main
124
330
  - README
@@ -132,6 +338,8 @@ executables:
132
338
  - bioworks_to_pepxml_gui.rb
133
339
  - gi2annot.rb
134
340
  - protein_summary.rb
341
+ - ms_to_lmat.rb
342
+ - aafreqs.rb
135
343
  - bioworks2excel.rb
136
344
  - pepproph_filter.rb
137
345
  - fasta_shaker.rb
@@ -139,16 +347,15 @@ executables:
139
347
  - protxml2prots_peps.rb
140
348
  - id_precision.rb
141
349
  - id_class_anal.rb
142
- - mzxml_to_lmat.rb
143
- - find_aa_freq.rb
144
- - filter.rb
350
+ - prob_validate.rb
351
+ - srf_to_sqt.rb
352
+ - filter_and_validate.rb
145
353
  - srf_group.rb
146
- - precision.rb
147
354
  - raw_to_mzXML.rb
148
355
  extensions: []
149
356
 
150
357
  requirements:
151
- - "\"xmlparser\" is the prefered xml parser right now. REXML and regular expressions are used as fallback in some routines."
358
+ - "\"libxml\" is the prefered xml parser right now. libxml, xmlparser, REXML and regular expressions are used as fallback in some routines."
152
359
  - some plotting functions will not be available without the "gnuplot" gem (and underlying gnuplot binary)
153
360
  - the "t2x" binary (in archive) or readw.exe is required to convert .RAW files to mzXML in some applications
154
361
  - "\"rake\" is useful for development"
@@ -161,5 +368,14 @@ dependencies:
161
368
  requirements:
162
369
  - - ~>
163
370
  - !ruby/object:Gem::Version
164
- version: 0.1.4
371
+ version: 0.2.5
372
+ version:
373
+ - !ruby/object:Gem::Dependency
374
+ name: axml
375
+ version_requirement:
376
+ version_requirements: !ruby/object:Gem::Version::Requirement
377
+ requirements:
378
+ - - ">"
379
+ - !ruby/object:Gem::Version
380
+ version: 0.0.0
165
381
  version:
data/bin/filter.rb DELETED
@@ -1,6 +0,0 @@
1
- #!/usr/bin/ruby -w
2
-
3
-
4
- require 'spec_id/filter'
5
-
6
- SpecID::Filter.run_from_argv(ARGV)
data/bin/precision.rb DELETED
@@ -1,5 +0,0 @@
1
- #!/usr/bin/ruby
2
-
3
- require 'spec_id'
4
-
5
- SpecID.precision(ARGV)
@@ -1,108 +0,0 @@
1
- require 'spec/msrun'
2
- require 'spec/mzdata'
3
-
4
- begin
5
- require 'xmlparser'
6
- rescue LoadError
7
- puts "*******************************************************************"
8
- puts "WARNING: 'xmlparser' library not installed:"
9
- puts "Defaulting to REXML (slower, but guaranteed to parse correct xml)"
10
- puts "Use :parse_type => 'regex' for faster (but not guaranteed) parsing"
11
- puts "Or install 'xmlparser'!"
12
- puts "*******************************************************************"
13
- end
14
- begin
15
- $XMLParserClass = XMLParser
16
- rescue NameError
17
- $XMLParserClass = Object
18
- end
19
-
20
-
21
- module Spec::MzData::PrecMzByNum; end
22
- module Spec::MzData::XMLParser; end
23
-
24
-
25
- class Spec::MzData::XMLParser::PrecMzByNum < $XMLParserClass
26
-
27
- ## This is an example from mzXML
28
- =begin
29
- @@scan_num = nil
30
- @@get_data = false
31
-
32
- attr_accessor :prec_mz
33
- def initialize
34
- @prec_mz = []
35
- end
36
-
37
- def startElement(name,attrs)
38
- if name == "scan"
39
- @@scan_num = attrs["num"].to_i
40
- elsif name == "precursorMz"
41
- @prec_mz[@@scan_num] = ""
42
- @@get_data = true
43
- end
44
- end
45
-
46
- def endElement(name)
47
- if name == "precursorMz"
48
- @@get_data = false
49
- end
50
- end
51
-
52
- def character(data)
53
- if @@get_data
54
- @prec_mz[@@scan_num] << data
55
- end
56
- end
57
- =end
58
-
59
- end
60
-
61
-
62
- class Spec::MzData::Parser
63
-
64
- def default_parser
65
- xmlparser = false
66
- $".each do |lib|
67
- if lib =~ /xmlparser/
68
- xmlparser = true
69
- end
70
- end
71
- if xmlparser
72
- return "xmlparser"
73
- else
74
- return "rexml"
75
- end
76
- end
77
-
78
-
79
- # Returns array where array[scan_num] = precursorMz
80
- # Parent scans are not arrayed
81
- # Values are strings. Array index likely starts at 1!
82
- # parse_type = "regex" | "rexml" | "xmlparser"
83
- # (only xmlparser works for now!)
84
- def precursor_mz_by_scan(file, parse_type=nil)
85
- puts "NO PARSERS AVAIALABLE YET!!"
86
- throw Exception
87
- # unless parse_type then parse_type = default_parser end
88
- # case parse_type
89
- # when "xmlparser"
90
- # ##XMLParser:
91
- # parser = Spec::MzData::XMLParser::PrecMzByNum.new
92
- # File.open(file) do |fh|
93
- # parser.parse(fh.read)
94
- # end
95
- # parser.prec_mz
96
- # when "regex"
97
- # Spec::MzData::Regexp.precursor_mz_by_scan(file)
98
- # when "rexml"
99
- # listener = Spec::MzData::REXMLStreamListener::PrecMzByNum.new
100
- # REXML::Document.parse_stream(File.new(file), listener)
101
- # listener.prec_mz
102
- # else
103
- # puts "Don't recognize parse_type: #{parse_type}"
104
- # end
105
- end
106
-
107
-
108
- end
data/lib/spec/mzdata.rb DELETED
@@ -1,48 +0,0 @@
1
-
2
- #######################################################
3
- # THIS NEEDS TO BE WORKED FOR mzdata!
4
- #######################################################
5
-
6
- require 'base64'
7
-
8
- module Spec; end
9
-
10
- module Spec::MzData
11
-
12
- ####################
13
- # THIS IS FOR mzXML right now!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
14
- ####################
15
- # takes a base64 peaks string and returns an array of [m/z,intens] doublets
16
- # mzXML as network ordered
17
- def base64_peaks_to_pairs(string, precision=32)
18
- data = base64_peaks_to_array(string, precision)
19
- ndata = []
20
- data.each_with_index do |dat,ind|
21
- if (ind % 2) == 0 # even
22
- arr = Array.new(2)
23
- arr[0] = dat
24
- ndata.push( arr )
25
- else
26
- ndata.last[1] = dat
27
- end
28
- end
29
- ndata
30
- end
31
-
32
- ####################
33
- # THIS IS FOR mzXML right now!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
34
- ####################
35
- # takes a base64 peaks string and returns an array of alternating m/z and
36
- # intensity mzXML as network ordered
37
- def base64_peaks_to_array(string, precision=32)
38
- b64d = Base64.decode64(string)
39
- if precision == 32
40
- unpack_code = "g*"
41
- elsif precision == 64
42
- unpack_code = "G*"
43
- end
44
- b64d.unpack(unpack_code)
45
- end
46
-
47
-
48
- end