transform_xlsx 0.0.1

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml ADDED
@@ -0,0 +1,15 @@
1
+ ---
2
+ !binary "U0hBMQ==":
3
+ metadata.gz: !binary |-
4
+ ZTIxYTdjNzZiNmYzZDVlNWY4NzJhMTFjZjkzNzVkZTc5MGI5Y2YwMw==
5
+ data.tar.gz: !binary |-
6
+ OTg0M2VjNGMwM2M4Zjc5Nzc5MTBkM2JjNmJmNDE3MDNmY2Y4ZDM5MQ==
7
+ SHA512:
8
+ metadata.gz: !binary |-
9
+ MTEyZjdmZTNjNGQwY2M2YmNhYjg4MWZmZWZiZTNkNzliM2U2OTM0YjdkM2Y4
10
+ OThkMjA4N2VjOTYzNTc1ZjhmMWQwOTQ1ZDVjMjMzZTJjOThjZDg5ZjkyOWIw
11
+ ZDk2NjJlM2RhYjMwNGZiZDA4NDVmYjY2ZGM5YTZkOWEwNGRjYWE=
12
+ data.tar.gz: !binary |-
13
+ N2JiNGJiMzE3YWY5MjZjMzcxYmQ0YWUxZmM4NjkyZWQ5MDcxMjlkNTg1ZjM0
14
+ Y2VlNDQ4NmJlZmU2M2E1YmJlZTlkNzdhMTE5OWVkYmFkN2NkNTA3ZDU5YWFk
15
+ NzhiNjY2NDc5OGNhODVhNDVkZGI4Yzc0YmY3MDVkMjc2MjJhOTY=
data/.gitignore ADDED
@@ -0,0 +1,17 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in transform_xlsx.gemspec
4
+ gemspec
data/LICENSE.txt ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2015 Prathiba Kn
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,46 @@
1
+ # TransformXlsx
2
+
3
+ TransformXlsx turns complex Excel input into organised output held in simple data structures (Hash or JSON).
4
+ This gem can be used to parse Excel sheets whose data is laid out in relationally complex ways.
5
+ The idea is to provide a memory-efficient and quick way to parse huge Excel sheets.
6
+
7
+ ## Installation
8
+
9
+ Add this line to your application's Gemfile:
10
+
11
+ gem 'transform_xlsx'
12
+
13
+ And then execute:
14
+
15
+ $ bundle
16
+
17
+ Or install it yourself as:
18
+
19
+ $ gem install transform_xlsx
20
+
21
+ ## Usage
22
+ For parsing xlsx files that contain two-dimensional (X by Y) data:
23
+
24
+ convert = TransformXlsx::TwoDimensional.new(file_path, sheet_number, start_row_number)
25
+
26
+ convert.to_hash
27
+ convert.to_json
28
+
29
+ For parsing xlsx files that contain one-dimensional (plain table) data:
30
+
31
+
32
+ convert = TransformXlsx::SingleDimensional.new(file_path, sheet_number, start_row_number)
33
+
34
+ convert.to_hash
35
+ convert.to_json
36
+
37
+ Coming Soon:
38
+ Parsing hierarchical data
39
+
40
+ ## Contributing
41
+
42
+ 1. Fork it
43
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
44
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
45
+ 4. Push to the branch (`git push origin my-new-feature`)
46
+ 5. Create new Pull Request
data/Rakefile ADDED
@@ -0,0 +1,10 @@
1
require 'rspec/core/rake_task'
require 'bundler/gem_tasks'

# Defines `rake spec`, which runs the RSpec suite (the gem keeps its spec
# files under `spec/`) with coloured, documentation-style output.
#
# The 'documentation' formatter name is used instead of the old 'nested'
# alias: the gemspec does not pin an rspec version, and 'nested' is only
# understood by RSpec 2, whereas 'documentation' works on RSpec 2 and 3.
RSpec::Core::RakeTask.new(:spec) do |task|
  task.rspec_opts = ['--color', '--format', 'documentation']
end

# Plain `rake` runs the specs.
task :default => :spec
@@ -0,0 +1,8 @@
1
+ require "transform_xlsx/version"
2
+ require "transform_xlsx/data_type"
3
+ require "transform_xlsx/single_dimensional"
4
+ require "transform_xlsx/two_dimensional"
5
+
6
# Top-level namespace of the transform_xlsx gem. The concrete transformers
# and the VERSION constant are defined in the files required by this entry
# point; nothing is defined here directly.
module TransformXlsx
end
@@ -0,0 +1,38 @@
1
+ require 'roo'
2
+ require 'json'
3
+
4
# Base class for the sheet transformers.
#
# Opens an .xlsx workbook with Roo, picks one sheet by its index in the
# workbook's +sheets+ list, checks that the requested start row is the
# sheet's first row, and stores the sheet's rows in +data+ keyed by the
# sheet name. Subclasses override +process_data+ to shape the output that
# +to_hash+ / +to_json+ return.
class DataType
  attr_accessor :start_row, :data

  # file_path    - path handed to Roo::Excelx.new
  # sheet_number - index into the workbook's +sheets+ array
  # start_row    - row number that must equal the sheet's +first_row+
  #
  # Raises RuntimeError (from validate_input) when the sheet does not exist
  # or the start row does not match.
  def initialize(file_path, sheet_number, start_row)
    @start_row = start_row
    file = Roo::Excelx.new(file_path)

    sheet_name = file.sheets[sheet_number]
    validate_input(file, sheet_name, start_row, sheet_number)

    # validate_input has already made sheet_name the default sheet, so the
    # rows read here come from that sheet.
    @data = { sheet_name => file.to_a }
  end

  # Checks the requested sheet and start row, and selects the sheet on +file+.
  #
  # file         - object responding to +default_sheet=+ and +first_row+
  # sheet_name   - name looked up by the caller; nil means "no such sheet"
  # start_row    - row number expected to equal +file.first_row+
  # sheet_number - optional; only used to build the error message. It used
  #                to be referenced without being in scope, which raised a
  #                NameError instead of the intended message.
  #
  # Returns nil. Raises RuntimeError on either failed check.
  def validate_input(file, sheet_name, start_row, sheet_number = nil)
    raise "Sheet number #{sheet_number} not found" if sheet_name.nil?

    file.default_sheet = sheet_name
    raise "No column data at start row - #{start_row}" unless file.first_row == start_row
  end

  # Hook for subclasses; the base implementation produces nothing (nil).
  def process_data
  end

  # Returns whatever +process_data+ builds.
  def to_hash
    process_data
  end

  # Returns +to_hash+ serialised as a JSON string.
  def to_json
    to_hash.to_json
  end
end
@@ -0,0 +1,18 @@
1
+ #require 'data_type'
2
module TransformXlsx
  # Transformer for one-dimensional (plain table) sheets.
  #
  # No reshaping is done: the result is the hash built by DataType, i.e.
  #   hash[sheet_name] = [[col1, col2, col3], [val1, val2, val3], ...]
  class SingleDimensional < DataType
    # Takes the same arguments as DataType#initialize and forwards them
    # unchanged.
    def initialize(file_path, sheet_number, start_row)
      super
    end

    # Returns the +data+ hash exactly as DataType#initialize stored it.
    def process_data
      data
    end
  end
end
@@ -0,0 +1,38 @@
1
+ #require 'data_type'
2
module TransformXlsx
  # Transformer for two-dimensional (X by Y) sheets.
  #
  # The row at +start_row+ supplies the column names; in every other
  # non-empty row the first non-nil cell is the row key and the remaining
  # cells are that row's values. The result is nested column-first:
  #   hash[sheet_name] = { column1 => { row_key1 => value, row_key2 => value } }
  class TwoDimensional < DataType
    # Takes the same arguments as DataType#initialize.
    def initialize(file_path, sheet_number, start_row)
      super(file_path, sheet_number, start_row)
    end

    # Builds and returns the nested hash described on the class.
    def process_data
      # Index of the header row inside each sheet's row array.
      # NOTE(review): this assumes index 0 of the array is worksheet row 1,
      # which is what the existing `@start_row - 1` lookup relies on —
      # confirm against the Roo version in use.
      header_index = @start_row - 1

      @data.each_with_object({}) do |(sheet_name, rows), hashed|
        # Empty header cells (such as the top-left corner) are dropped, so
        # cell i of a data row maps to columns[i - 1].
        columns = rows[header_index].compact
        by_column = hashed[sheet_name] = {}
        columns.each { |column| by_column[column] = {} }

        rows.each_with_index do |row, idx|
          # Skip the header row itself. This used to skip index 0 regardless
          # of start_row, so a header further down was processed as data.
          next if idx == header_index

          row_key = row.compact.first
          next if row_key.nil? # completely empty row

          row.each_with_index do |value, i|
            next if i.zero? # first cell is not treated as a value

            column = columns[i - 1]
            # A cell with no header above it has no column to belong to;
            # skip it instead of failing on a nil lookup.
            next if column.nil?

            by_column[column][row_key] = value
          end
        end
      end
    end
  end
end
38
+
@@ -0,0 +1,3 @@
1
module TransformXlsx
  # Version string of the gem.
  VERSION = '0.0.1'
end
Binary file
Binary file
@@ -0,0 +1 @@
1
+
@@ -0,0 +1,2 @@
1
+ $LOAD_PATH.unshift File.expand_path('../../lib', __FILE__)
2
+ require 'transform_xlsx'
@@ -0,0 +1,23 @@
1
require 'spec_helper'

# Exercises TransformXlsx::TwoDimensional against the second sheet
# (index 1, named "Sheet2" in the expectations) of the fixture workbook,
# with row 1 as the header row.
describe "TwoDimensional" do
  before(:all) do
    @convert = TransformXlsx::TwoDimensional.new("spec/fixtures/Workbook1.xlsx", 1, 1)
  end

  it "should transform the excel sheet given a sheet number and start row into a Hash object" do
    hash_result = {"Sheet2"=>{"p1"=>{"metric 1"=>1.0, "m2"=>6.0, "m3"=>23.0, "m4"=>56.0, "m5"=>56.0, "m6"=>4.0, "m7"=>3.0, "m8"=>345.0, "m9"=>76.0}, "p2"=>{"metric 1"=>2.0, "m2"=>7.0, "m3"=>345.0, "m4"=>234.0, "m5"=>3.0, "m6"=>345.0, "m7"=>35.0, "m8"=>nil, "m9"=>345.0}, "p3"=>{"metric 1"=>3.0, "m2"=>8.0, "m3"=>6.0, "m4"=>234.0, "m5"=>nil, "m6"=>676.0, "m7"=>678.0, "m8"=>345.0, "m9"=>34.0}, "p4"=>{"metric 1"=>4.0, "m2"=>9.0, "m3"=>4.0, "m4"=>234.0, "m5"=>2.0, "m6"=>567.0, "m7"=>567.0, "m8"=>45.0, "m9"=>45.0}, "p5"=>{"metric 1"=>5.0, "m2"=>0.0, "m3"=>34.0, "m4"=>234.0, "m5"=>2.0, "m6"=>567.0, "m7"=>345.0, "m8"=>567.0, "m9"=>56.0}, "p6"=>{"metric 1"=>6.0, "m2"=>-5.0, "m3"=>234.0, "m4"=>234.0, "m5"=>2.0, "m6"=>34.0, "m7"=>567.0, "m8"=>567.0, "m9"=>55.0}}}
    expect(@convert.to_hash).to eql hash_result
  end

  it "should transform the excel sheet given a sheet number and start row into a JSON object" do
    json_result = "{\"Sheet2\":{\"p1\":{\"metric 1\":1.0,\"m2\":6.0,\"m3\":23.0,\"m4\":56.0,\"m5\":56.0,\"m6\":4.0,\"m7\":3.0,\"m8\":345.0,\"m9\":76.0},\"p2\":{\"metric 1\":2.0,\"m2\":7.0,\"m3\":345.0,\"m4\":234.0,\"m5\":3.0,\"m6\":345.0,\"m7\":35.0,\"m8\":null,\"m9\":345.0},\"p3\":{\"metric 1\":3.0,\"m2\":8.0,\"m3\":6.0,\"m4\":234.0,\"m5\":null,\"m6\":676.0,\"m7\":678.0,\"m8\":345.0,\"m9\":34.0},\"p4\":{\"metric 1\":4.0,\"m2\":9.0,\"m3\":4.0,\"m4\":234.0,\"m5\":2.0,\"m6\":567.0,\"m7\":567.0,\"m8\":45.0,\"m9\":45.0},\"p5\":{\"metric 1\":5.0,\"m2\":0.0,\"m3\":34.0,\"m4\":234.0,\"m5\":2.0,\"m6\":567.0,\"m7\":345.0,\"m8\":567.0,\"m9\":56.0},\"p6\":{\"metric 1\":6.0,\"m2\":-5.0,\"m3\":234.0,\"m4\":234.0,\"m5\":2.0,\"m6\":34.0,\"m7\":567.0,\"m8\":567.0,\"m9\":55.0}}}"
    expect(@convert.to_json).to eql json_result
  end

  it "should raise error if sheet number does not exist" do
    # The workbook has no sheet at index 100.
    expect { TransformXlsx::TwoDimensional.new("spec/fixtures/Workbook1.xlsx", 100, 1) }.to raise_error
  end

  it "should raise error if the start row does not contain data" do
    # Row 10 is not the first row of the sheet, so validation must fail.
    expect { TransformXlsx::TwoDimensional.new("spec/fixtures/Workbook1.xlsx", 1, 10) }.to raise_error
  end
end
@@ -0,0 +1,26 @@
1
+ # coding: utf-8
2
# Put the gem's own lib/ directory on the load path so the version file can
# be required before the gem is installed.
lib_dir = File.expand_path('../lib', __FILE__)
$LOAD_PATH.unshift(lib_dir) unless $LOAD_PATH.include?(lib_dir)
require 'transform_xlsx/version'

Gem::Specification.new do |spec|
  # Identity
  spec.name     = "transform_xlsx"
  spec.version  = TransformXlsx::VERSION
  spec.authors  = ["Prathiba Kn"]
  spec.email    = ["prathiba_kn@gmail.com"]
  spec.license  = "MIT"
  spec.homepage = ""

  # Descriptions
  spec.summary     = "Transforms 1D and 2D excelx file into Hash or Json objects"
  spec.description = "Transforms Excelx file into Hash Or Json objects"

  # Packaged files: everything tracked by git, one path per line of
  # `git ls-files` output.
  tracked_files      = `git ls-files`.split($/)
  spec.files         = tracked_files
  spec.executables   = spec.files.grep(%r{^bin/}).map { |path| File.basename(path) }
  spec.test_files    = spec.files.grep(%r{^(test|spec|features)/})
  spec.require_paths = ["lib"]

  # Development-only dependencies
  spec.add_development_dependency "bundler", "~> 1.3"
  spec.add_development_dependency "rake"
  spec.add_development_dependency "rspec"

  # Runtime dependencies
  spec.add_dependency "roo"
  spec.add_dependency "json"
end
metadata ADDED
@@ -0,0 +1,135 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: transform_xlsx
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ platform: ruby
6
+ authors:
7
+ - Prathiba Kn
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2015-07-14 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ~>
18
+ - !ruby/object:Gem::Version
19
+ version: '1.3'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - ~>
25
+ - !ruby/object:Gem::Version
26
+ version: '1.3'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - ! '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - ! '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - ! '>='
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - ! '>='
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: roo
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - ! '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :runtime
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - ! '>='
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ - !ruby/object:Gem::Dependency
70
+ name: json
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - ! '>='
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ type: :runtime
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - ! '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ description: Transforms Excelx file into Hash Or Json objects
84
+ email:
85
+ - prathiba_kn@gmail.com
86
+ executables: []
87
+ extensions: []
88
+ extra_rdoc_files: []
89
+ files:
90
+ - .gitignore
91
+ - Gemfile
92
+ - LICENSE.txt
93
+ - README.md
94
+ - Rakefile
95
+ - lib/transform_xlsx.rb
96
+ - lib/transform_xlsx/data_type.rb
97
+ - lib/transform_xlsx/single_dimensional.rb
98
+ - lib/transform_xlsx/two_dimensional.rb
99
+ - lib/transform_xlsx/version.rb
100
+ - spec/fixtures/Workbook1.xlsx
101
+ - spec/fixtures/new.xlsx
102
+ - spec/single_dimensional_spec.rb
103
+ - spec/spec_helper.rb
104
+ - spec/two_dimensional_spec.rb
105
+ - transform_xlsx.gemspec
106
+ homepage: ''
107
+ licenses:
108
+ - MIT
109
+ metadata: {}
110
+ post_install_message:
111
+ rdoc_options: []
112
+ require_paths:
113
+ - lib
114
+ required_ruby_version: !ruby/object:Gem::Requirement
115
+ requirements:
116
+ - - ! '>='
117
+ - !ruby/object:Gem::Version
118
+ version: '0'
119
+ required_rubygems_version: !ruby/object:Gem::Requirement
120
+ requirements:
121
+ - - ! '>='
122
+ - !ruby/object:Gem::Version
123
+ version: '0'
124
+ requirements: []
125
+ rubyforge_project:
126
+ rubygems_version: 2.4.6
127
+ signing_key:
128
+ specification_version: 4
129
+ summary: Transforms 1D and 2D excelx file into Hash or Json objects
130
+ test_files:
131
+ - spec/fixtures/Workbook1.xlsx
132
+ - spec/fixtures/new.xlsx
133
+ - spec/single_dimensional_spec.rb
134
+ - spec/spec_helper.rb
135
+ - spec/two_dimensional_spec.rb