easy_sheet_io 0.2.2 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 6de67291cc58a0ab7ea017efd79e847351f71e6790f5f2e4e3fb4462c2ff5f47
4
- data.tar.gz: aa0dca360cfa89666b291d8ddeea149399068fbf57f12c422e615c5da03ac71e
3
+ metadata.gz: ec3308eccf2e355a8c32cf0a3496425522f793633d84203fb6378b460c99b6e0
4
+ data.tar.gz: 0e00581c782acbbe52883dc0b7e298158854ac4fe992e2fc825c0c766b1f0c67
5
5
  SHA512:
6
- metadata.gz: 6cadf3040934873c1a9182000d6b90a9fbad20056e1bd0c17e2fe21929643a2a438832e4fdcdb5519b1def845925526cc3c4df460346affe397a8c05bddf95ce
7
- data.tar.gz: 3d7df3a901737bdca5ee7cf8e9399b2d958d51134328ea5ee33ac5e17126847c54ff3e20617ad26b073029afbc790e31e10bef66d18b2d74429f36db417ddef9
6
+ metadata.gz: 54a4b942475d211a2a5d6e9cd3621ed94366f6f4ea313c6eb338b9e10ee426f5bee961de91bab5d31e1b5f3cd3b84bd8636cd002af22122f5140c8303741605f
7
+ data.tar.gz: 76caa06c1a889fb1e70c6b6b2b5a8e8a483811d24380708443fc527305da8931b5c2f42728d4d82df0e426f7a48e8a992d52896ae77f9af4e7559b3fb7115b77
data/Gemfile CHANGED
@@ -6,9 +6,7 @@ source "https://rubygems.org"
6
6
  gemspec
7
7
 
8
8
  gem "rake", "~> 13.0"
9
-
10
9
  gem "rspec", "~> 3.0"
11
-
12
10
  gem "rubocop", "~> 0.80"
13
11
 
14
12
  gem "daru"
data/Gemfile.lock CHANGED
@@ -1,7 +1,15 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- easy_sheet_io (0.2.1)
4
+ easy_sheet_io (0.2.4)
5
+ daru (>= 0.3)
6
+ rake (~> 13.0)
7
+ roo-xls (>= 1.2.0)
8
+ rover-df (>= 0.2.7)
9
+ rspec (~> 3.0)
10
+ rubocop (~> 0.80)
11
+ smarter_csv (>= 1.4.2)
12
+ spreadsheet (>= 1.3.0)
5
13
 
6
14
  GEM
7
15
  remote: https://rubygems.org/
@@ -31,7 +31,15 @@ Gem::Specification.new do |spec|
31
31
 
32
32
  # Uncomment to register a new dependency of your gem
33
33
  # spec.add_dependency "example-gem", "~> 1.0"
34
-
34
+ spec.add_dependency "rake", "~> 13.0"
35
+ spec.add_dependency "rspec", "~> 3.0"
36
+ spec.add_dependency "rubocop", "~> 0.80"
37
+
38
+ spec.add_dependency "daru", ">= 0.3"
39
+ spec.add_dependency "rover-df", ">= 0.2.7"
40
+ spec.add_dependency "smarter_csv", ">= 1.4.2"
41
+ spec.add_dependency "roo-xls", ">= 1.2.0"
42
+ spec.add_dependency "spreadsheet", ">= 1.3.0"
35
43
  # For more information and examples about making a new gem, checkout our
36
44
  # guide at: https://bundler.io/guides/creating_gem.html
37
45
  end
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module EasySheetIo
4
- VERSION = "0.2.2"
4
+ VERSION = "0.3.0"
5
5
  end
data/lib/easy_sheet_io.rb CHANGED
@@ -12,7 +12,7 @@ module EasySheetIo
12
12
  class Error < StandardError; end
13
13
 
14
14
  module_function
15
-
15
+
16
16
  def read(path, **opt)
17
17
  return /csv$/ === path ? read_csv(path, **opt) : read_excel(path, **opt)
18
18
  end
@@ -47,9 +47,11 @@ module EasySheetIo
47
47
  end
48
48
 
49
49
  # Convert 2d Array to Hash
50
- # ##header: nil -> Default Headers(:column1, column2,...) are generated.
51
- # line_until=nil means the data are picked up until the end line.
52
- def to_hash(array2d, line_from: 1, line_until: nil, header: 0, symbol_header: false)
50
+ ## header: nil -> Default Headers(:column1, column2,...) are generated.
51
+ ## Option line_ignored is not implemented yet.
52
+ def to_hash(array2d, line_from: 1, line_until: nil, line_ignored: nil,
53
+ header: 0, symbol_header: false,
54
+ replace_to_nil: [], analyze_type: true)
53
55
 
54
56
  # Define Read Range------------
55
57
  lfrom, luntil = line_from, line_until
@@ -65,6 +67,7 @@ module EasySheetIo
65
67
  # Define Data Array------------
66
68
  output = array2d[lfrom...luntil]
67
69
  output_transpose = output[0].zip(*output[1..])
70
+ output_transpose = fix_array(output_transpose, replace_to_nil, analyze_type)
68
71
  # -----------------------------
69
72
 
70
73
  # Define Header----------------
@@ -84,8 +87,12 @@ module EasySheetIo
84
87
  return Rover::DataFrame.new(data)
85
88
  end
86
89
  end
87
-
88
- # ##Genarate Array from excel file
90
+
91
+ #----------------------------
92
+ # Private metods from here
93
+ #----------------------------
94
+
95
+ # Genarate Array from excel file
89
96
  def open_excel(path, sheet_i, encoding: "utf-8")
90
97
  if /xlsx$/ === path
91
98
  puts "Sorry, encoding option is not supported yet for xlsx file." if encoding != "utf-8"
@@ -118,8 +125,56 @@ module EasySheetIo
118
125
  end
119
126
  end
120
127
 
128
+ # Fix Array (Replace specific values to nil, recognize value type and cast values to the type.)
129
+ def fix_array(array2d, replace_to_nil, analyze_type)
130
+ ans = array2d
131
+
132
+ ## Replace Blank or User-Selected Value
133
+ ans = ans.map do |column|
134
+ column.map { |cell| replace_to_nil.include?(cell) || /^\s*$/ === cell ? nil : cell }
135
+ end
136
+
137
+ ## Replace Number Values to Integer or Float
138
+ if analyze_type
139
+ ans = ans.map.with_index do |column, i|
140
+ type_of_column = :any
141
+ column.each { |cell| type_of_column = recognize_type(cell, type_of_column) }
142
+
143
+ # p type_of_column
144
+ case type_of_column
145
+ when :int
146
+ column.map { _1.nil? ? nil : _1.to_i }
147
+ when :float
148
+ column.map { _1.nil? ? nil : _1.to_f }
149
+ else
150
+ column
151
+ end
152
+ end
153
+ end
154
+
155
+ return ans
156
+ end
157
+
158
+ def recognize_type(str, expected)
159
+ return expected if str.nil?
160
+
161
+ order = {:any => 0, :int => 1, :float => 2, :string => 3}
162
+ if /^\s*(-|\+)?\d+\s*$/ === str
163
+ type_of_str = :int
164
+ elsif /^\s*(-|\+)?\d*\.\d*\s*$/ === str || /^\s*(-|\+)?(\d*\.\d+|\d+)(e|E)(-|\+)?\d+\s*$/ === str
165
+ type_of_str = :float
166
+ else
167
+ type_of_str = :string
168
+ end
169
+
170
+ # p "#{type_of_str}, #{str}" if order[type_of_str] > order[expected]
171
+
172
+ return order[type_of_str] > order[expected] ? type_of_str : expected
173
+ end
174
+
121
175
  # Fix blank or duplicated header
122
176
  def check_header(header_array)
177
+ # Check Blank
123
178
  ans = header_array.map.with_index do |item, i|
124
179
  if item.nil?
125
180
  "column#{i}"
@@ -130,6 +185,7 @@ module EasySheetIo
130
185
  end
131
186
  end
132
187
 
188
+ # Check Duplicated Value
133
189
  dup_check = (0...(header_array.length)).group_by {|i| ans[i]}
134
190
  dup_check.each do |item, i_s|
135
191
  if i_s.length > 1
@@ -140,4 +196,6 @@ module EasySheetIo
140
196
  return ans
141
197
  end
142
198
 
199
+ private_class_method :open_excel, :fix_array, :check_header
200
+
143
201
  end
metadata CHANGED
@@ -1,15 +1,127 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: easy_sheet_io
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.2.2
4
+ version: 0.3.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - show-o-atakun
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2022-03-23 00:00:00.000000000 Z
12
- dependencies: []
11
+ date: 2022-03-25 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: rake
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '13.0'
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '13.0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rspec
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '3.0'
34
+ type: :runtime
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '3.0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rubocop
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '0.80'
48
+ type: :runtime
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: '0.80'
55
+ - !ruby/object:Gem::Dependency
56
+ name: daru
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - ">="
60
+ - !ruby/object:Gem::Version
61
+ version: '0.3'
62
+ type: :runtime
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - ">="
67
+ - !ruby/object:Gem::Version
68
+ version: '0.3'
69
+ - !ruby/object:Gem::Dependency
70
+ name: rover-df
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - ">="
74
+ - !ruby/object:Gem::Version
75
+ version: 0.2.7
76
+ type: :runtime
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - ">="
81
+ - !ruby/object:Gem::Version
82
+ version: 0.2.7
83
+ - !ruby/object:Gem::Dependency
84
+ name: smarter_csv
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - ">="
88
+ - !ruby/object:Gem::Version
89
+ version: 1.4.2
90
+ type: :runtime
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - ">="
95
+ - !ruby/object:Gem::Version
96
+ version: 1.4.2
97
+ - !ruby/object:Gem::Dependency
98
+ name: roo-xls
99
+ requirement: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - ">="
102
+ - !ruby/object:Gem::Version
103
+ version: 1.2.0
104
+ type: :runtime
105
+ prerelease: false
106
+ version_requirements: !ruby/object:Gem::Requirement
107
+ requirements:
108
+ - - ">="
109
+ - !ruby/object:Gem::Version
110
+ version: 1.2.0
111
+ - !ruby/object:Gem::Dependency
112
+ name: spreadsheet
113
+ requirement: !ruby/object:Gem::Requirement
114
+ requirements:
115
+ - - ">="
116
+ - !ruby/object:Gem::Version
117
+ version: 1.3.0
118
+ type: :runtime
119
+ prerelease: false
120
+ version_requirements: !ruby/object:Gem::Requirement
121
+ requirements:
122
+ - - ">="
123
+ - !ruby/object:Gem::Version
124
+ version: 1.3.0
13
125
  description: A simple way to Open .csv, .xls, .xlsx files. You can convert it to 2D
14
126
  array, hash, data frame.
15
127
  email: