dcd 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (9) hide show
  1. checksums.yaml +7 -0
  2. data/.gitignore +9 -0
  3. data/Gemfile +1 -0
  4. data/LICENSE.txt +21 -0
  5. data/README.md +44 -0
  6. data/Rakefile +2 -0
  7. data/dcd.gemspec +20 -0
  8. data/lib/dcd.rb +225 -0
  9. metadata +79 -0
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: a042ccc8e4a657dec774f8aef387bca1e6d9bb91
4
+ data.tar.gz: 2f9be85b8c3ac648567f6313308a89e369b85e35
5
+ SHA512:
6
+ metadata.gz: c281f10fbbeb7ed570212f4accb0775766fb98dff1479273b50771554ad68c9404b0e9a7c440d783e3bb5686ee989873f71803978ff221c3d4e1482fe12c778b
7
+ data.tar.gz: 37a27f524072ed45e048a254ba0d531d74e1709fb5a7380499a7a355fc1be4d7d59fea63e8837e20454b2c28b3bf6df1b6565557abb58642b5f3ca4c10d693d8
@@ -0,0 +1,9 @@
1
+ /.bundle/
2
+ /.yardoc
3
+ /Gemfile.lock
4
+ /_yardoc/
5
+ /coverage/
6
+ /doc/
7
+ /pkg/
8
+ /spec/reports/
9
+ /tmp/
data/Gemfile ADDED
@@ -0,0 +1 @@
1
+ source 'https://rubygems.org'
@@ -0,0 +1,21 @@
1
+ The MIT License (MIT)
2
+
3
+ Copyright (c) 2016 Joshua Smock
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in
13
+ all copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ THE SOFTWARE.
@@ -0,0 +1,44 @@
1
+ # DCD
2
+
3
+ DCD is a Ruby library for processing CHARMM and X-PLOR style binary trajectory files, aka DCD files. Based on the [`matdcd`](http://www.ks.uiuc.edu/Development/MDTools/matdcd/) and [VMD DCD plugin](http://www.ks.uiuc.edu/Research/vmd/plugins/doxygen/dcdplugin_8c-source.html), DCD parses and allows access to various metadata and atom information for use in scripts and automated environments where the numeric positions of the atoms is useful.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ gem 'dcd'
10
+
11
+ And then execute:
12
+
13
+ $ bundle
14
+
15
+ Or install it yourself as:
16
+
17
+ $ gem install dcd
18
+
19
+
20
+ ## Usage
21
+
22
+ DCD requires an io pointer to a binary DCD file upon initialization, and can be used in two ways: instant loading and lazy loading. The difference between instant and lazy loading is passing in an optional second argument upon initialization.
23
+
24
+ ```ruby
25
+ > require('dcd')
26
+ => true
27
+ > dcd_pointer = File.read('1407.dcd')
28
+ => #<File:./1407.dcd>
29
+ > lazy_load = false
30
+ => false
31
+ > my_dcd = DCD.new(dcd_pointer, lazy_load)
32
+ => ...
33
+ ```
34
+
35
+ Once loaded, you have access to the metadata, including the `nstep`, `nset`, and `step`, the title, and the frames with atom coordinates in `x`, `y`, `z`, and `w` if using a 4th dimensional DCD.
36
+
37
+ ## TODO
38
+
39
+ 1. Currently test coverage on this library is limited, especially around fixed atoms and CHARMM 4th dimensional parameters. If you DCDs, especially those with the aforementioned features, please make a pull request or an issue with the necessary files attached.
40
+ 2. Examples.
41
+
42
+ ## License
43
+
44
+ MIT. See LICENSE for more information.
@@ -0,0 +1,2 @@
1
+ require "bundler/gem_tasks"
2
+ task :default => :spec
@@ -0,0 +1,20 @@
1
+ # coding: utf-8
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+
5
+ Gem::Specification.new do |spec|
6
+ spec.name = "dcd"
7
+ spec.version = "0.0.1"
8
+ spec.authors = ["Joshua Smock"]
9
+ spec.email = ["joshuasmock@gmail.com"]
10
+
11
+ spec.summary = %q{DCD is a simple parser for CHARMM and X-PLOR binary trajectory files}
12
+ spec.homepage = "https://github.com/jo-sm/dcd"
13
+ spec.license = "MIT"
14
+
15
+ spec.files = `git ls-files -z`.split("\x0").reject { |f| f.match(%r{^(test|spec|features)/}) }
16
+ spec.require_paths = ["lib"]
17
+
18
+ spec.add_development_dependency "bundler", "~> 1.12.a"
19
+ spec.add_development_dependency "rake", "~> 10.0"
20
+ end
@@ -0,0 +1,225 @@
1
+ class DCD
2
+ attr_reader :metadata, :title, :frames
3
+
4
+ def initialize(io, lazy=false)
5
+ @io_pointer = io
6
+ @read_length = 0
7
+ @type = ''
8
+ @endian = ''
9
+ @title = ''
10
+ @metadata = {}
11
+ @frames = {}
12
+ @valid = true
13
+
14
+ if !lazy
15
+ read_header
16
+ read_atoms
17
+ end
18
+ end
19
+
20
+ # Loads the header, which determines endianness
21
+ # and the initial metadata about the DCD file
22
+ def read_header
23
+ determine_endianness
24
+ gather_metadata
25
+ read_title
26
+ read_atoms_metadata
27
+ end
28
+
29
+ def read_atoms
30
+ @frames[:x], @frames[:y], @frames[:z], @frames[:w] = [], [], [], []
31
+
32
+ @metadata[:nset].times do |i|
33
+ if @metadata[:extrablock]
34
+ # Unit cell info
35
+ i = @io_pointer.read(@read_length + 48 + @read_length).unpack("L#{endian}*")[0]
36
+ warn "Incorrect frame size in unit cell for step #{i}" if i[0] != i[-1]
37
+ # TODO: Process this data
38
+ end
39
+
40
+ # Treat first frame and fixed atoms DCD files differently
41
+ if i == 0 or @metadata[:num_fixed] == 0
42
+ # Read each frame
43
+ read_coord(:x)
44
+ read_coord(:y)
45
+ read_coord(:z)
46
+ read_coord(:w) if @metadata[:w_coords]
47
+ else
48
+ read_fixed_coord(:x)
49
+ read_fixed_coord(:y)
50
+ read_fixed_coord(:z)
51
+ read_coord(:w) if @metadata[:w_coords]
52
+ end
53
+ end
54
+ end
55
+
56
+ def print
57
+ if @title == '' or !@frames[:x]
58
+ warn "DCD has not been processed"
59
+ return nil
60
+ end
61
+
62
+ puts "#{@metadata[:is_charmm] ? 'CHARMM' : 'X-PLOR'} #{@type == 'l' ? '32' : '64'}-bit Trajectory File #{@endian == '>' ? 'Big' : 'Little'} Endian"
63
+ puts "#{@title}"
64
+ puts "Nset: #{@metadata[:nset]}"
65
+ puts "Istart: #{@metadata[:istart]}"
66
+ puts "Nsavc: #{@metadata[:nsavc]}"
67
+ puts "Nstep: #{@metadata[:nstep]}"
68
+ puts "Step size: #{@metadata[:step]} picoseconds"
69
+ puts "Number of atoms per frame: #{@metadata[:num_atoms]}"
70
+ @frames[:x].each_with_index do |coords, i|
71
+ puts "Frame #{i} coordinates"
72
+ coords.each_with_index do |coord, j|
73
+ puts "(#{j})\t\t\t#{@frames[:x][i][j]}\t\t#{@frames[:y][i][j]}\t\t#{@frames[:z][i][j]}"
74
+ end
75
+ end
76
+ end
77
+
78
+ private
79
+
80
+ def read_coord(coord)
81
+ coord_block_size = @io_pointer.read(@read_length).unpack("#{@type}#{@endian}")[0]
82
+ @frames[coord].push(@io_pointer.read(coord_block_size).unpack('f*'))
83
+ coord_check = @io_pointer.read(@read_length).unpack("#{@type}#{@endian}")[0]
84
+
85
+ warn "Invalid block size for #{coord} coords" if coord_block_size != coord_check
86
+ end
87
+
88
+ def read_fixed_coord(coord)
89
+ num_free = @metadata[:num_atoms] - @metadata[:num_fixed]
90
+
91
+ # Fixed atom coordinates are 4 bytes in length,
92
+ # and there are `num_free` amount of coordinates per block
93
+ fixed_coord_block_size = @io_pointer.read(@read_length).unpack("#{@type}#{@endian}")[0]
94
+ free_atom_coords = @io_pointer.read(4 * num_free).unpack('f*')
95
+ fixed_coord_check = @io_pointer.read(@read_length).unpack("#{@type}#{@endian}")[0]
96
+
97
+ raise StandardError, "Invalid DCD, fixed coordinate check did not match" if fixed_coord_block_size != fixed_coord_check
98
+
99
+ # Now, a copy of the first frame is made and the trajectory changes are overwritten
100
+ # with the free atom coordinates
101
+ new_coords = @coord[coord][0].clone
102
+
103
+ num_free.times do |i|
104
+ new_coords[@metadata[:free_indexes][i]] = free_atom_coords[i]
105
+ end
106
+
107
+ @coord[coord].push(new_coords)
108
+ end
109
+
110
+ # Determines endianness of DCD file
111
+ def determine_endianness
112
+ # Ensure that the pointer is as position 0
113
+ @io_pointer.seek(0)
114
+ initial_data = @io_pointer.read(4)
115
+
116
+ # Default to 32 bit for these values
117
+ @read_length = 4
118
+ @type = 'l'
119
+
120
+ # Determine if DCD file is 32 bit or 64 bit
121
+ puts initial_data.unpack('L>'), initial_data.unpack('L<')
122
+ if initial_data.unpack('L>')[0] == 84
123
+ # Big endian
124
+ @endian = '>'
125
+ elsif initial_data.unpack('L<')[0] == 84
126
+ # Little endian
127
+ @endian = '<'
128
+ end
129
+
130
+ puts @endian, @type
131
+
132
+ # If the endianness is not set, then the DCD file is 64 bit
133
+ if @endian == ''
134
+ @type = 'q'
135
+
136
+ second_byte = @io_pointer.read(4)
137
+ initial_data = initial_data + second_byte
138
+
139
+ @read_length = 8
140
+
141
+ if initial_data.unpack('q>')[0] == 84
142
+ @endian = '>'
143
+ elsif initial_data.unpack('q<')[0] == 84
144
+ @endian = '<'
145
+ end
146
+ end
147
+
148
+ if @endian == ''
149
+ @valid = false
150
+ raise StandardError, "Invalid DCD file"
151
+ end
152
+
153
+ if @io_pointer.read(4) != 'CORD'
154
+ @valid = false
155
+ raise StandardError, "Invalid DCD file"
156
+ end
157
+ end
158
+
159
+ # Gathers metadata, including if file is CHARMM format,
160
+ def gather_metadata
161
+ @io_pointer.seek(@read_length + 4)
162
+ metadata_raw = @io_pointer.read(80)
163
+
164
+ # The next @read_length amount of data when unpacked should equal 84
165
+ check = @io_pointer.read(@read_length).unpack("#{@type}#{@endian}")[0]
166
+ raise StandardError, "Invalid DCD format, expected 84 but saw #{check}" if check != 84
167
+
168
+ unpacked_meta = metadata_raw.unpack("L#{@endian}9a4L#{@endian}*")
169
+
170
+ @metadata[:is_charmm] = unpacked_meta[-1] != 0 # 76 - 79
171
+ @metadata[:nset] = unpacked_meta[0] # 0-3
172
+ @metadata[:istart] = unpacked_meta[1] # 4-7
173
+ @metadata[:nsavc] = unpacked_meta[2] # 8-11
174
+ @metadata[:nstep] = unpacked_meta[3] # 12-15 # not present in XPLOR files - is 0
175
+ # unpacked_meta[4] - unpacked_meta[7] are zeros
176
+ @metadata[:num_fixed] = unpacked_meta[8] # 32 - 35
177
+ @metadata[:step_size] = unpacked_meta[9].unpack(@metadata[:is_charmm] ? (@endian == '>' ? 'g' : 'e') : (@endian == '>' ? 'G' : 'E'))[0] # 36 - 39
178
+ @metadata[:charmm_extrablock] = unpacked_meta[10] != 0 # 40 - 43
179
+ @metadata[:w_coords] = unpacked_meta[11] == 1 # 44 - 47
180
+ end
181
+
182
+ def read_title
183
+ @io_pointer.seek(@read_length + 80 + 4 + @read_length)
184
+ title_metadata = @io_pointer.read(@read_length*2).unpack("#{@type}#{@endian}2")
185
+
186
+ size = title_metadata[0]
187
+ num_lines = title_metadata[1]
188
+
189
+ puts size, num_lines
190
+
191
+ # VMD's plugin notes: There are certain programs such as Vega ZZ that write an incorrect DCD file header. Check for these
192
+ if num_lines < 0
193
+ raise StandardError, "Invalid DCD file, negative title length"
194
+ elsif num_lines > 1000
195
+ num_lines = 0
196
+ num_lines = 2 if num_lines == 1095062083 # Vega ZZ
197
+ warn "Invalid title length, setting to #{num_lines}. May result in invalid subsequent IO reads"
198
+ end
199
+
200
+ title_data = @io_pointer.read(num_lines*80 + @read_length*3).unpack("a#{num_lines*80}#{@type}#{@endian}2l#{@endian}")
201
+ @title = title_data[0]
202
+ size_check = title_data[1]
203
+
204
+ raise StandardError, "Invalid DCD format, size mismatch" if size != size_check
205
+ raise StandardError, "Invalid DCD format, invalid check" if title_data[2] != 4
206
+ end
207
+
208
+ # This method does not know where to read, since the title can be variable length
209
+ # So this must be called after .read_title
210
+ def read_atoms_metadata
211
+ @metadata[:num_atoms] = @io_pointer.read(@read_length).unpack("#{@type}#{@endian}")[0]
212
+
213
+ if @metadata[:num_fixed] != 0
214
+ num_free_data = @io_pointer.read(@read_length + @metadata[:num_atoms] - @metadata[:num_fixed]).unpack("L#{@endian}*")
215
+
216
+ num_free = num_free_data[0]
217
+ @metadata[:free_indexes] = num_free_data[1..-2]
218
+ num_free_check = num_free_data[-1]
219
+
220
+ raise StandardError, "Invalid DCD format, fixed atoms check failed" if num_free != num_free_check
221
+ end
222
+
223
+ @metadata[:body_start] = @io_pointer.pos
224
+ end
225
+ end
metadata ADDED
@@ -0,0 +1,79 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: dcd
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ platform: ruby
6
+ authors:
7
+ - Joshua Smock
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2016-04-06 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: 1.12.a
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: 1.12.a
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '10.0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '10.0'
41
+ description:
42
+ email:
43
+ - joshuasmock@gmail.com
44
+ executables: []
45
+ extensions: []
46
+ extra_rdoc_files: []
47
+ files:
48
+ - ".gitignore"
49
+ - Gemfile
50
+ - LICENSE.txt
51
+ - README.md
52
+ - Rakefile
53
+ - dcd.gemspec
54
+ - lib/dcd.rb
55
+ homepage: https://github.com/jo-sm/dcd
56
+ licenses:
57
+ - MIT
58
+ metadata: {}
59
+ post_install_message:
60
+ rdoc_options: []
61
+ require_paths:
62
+ - lib
63
+ required_ruby_version: !ruby/object:Gem::Requirement
64
+ requirements:
65
+ - - ">="
66
+ - !ruby/object:Gem::Version
67
+ version: '0'
68
+ required_rubygems_version: !ruby/object:Gem::Requirement
69
+ requirements:
70
+ - - ">="
71
+ - !ruby/object:Gem::Version
72
+ version: '0'
73
+ requirements: []
74
+ rubyforge_project:
75
+ rubygems_version: 2.2.5
76
+ signing_key:
77
+ specification_version: 4
78
+ summary: DCD is a simple parser for CHARMM and X-PLOR binary trajectory files
79
+ test_files: []