officex2str 0.0.9 → 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: 7e56e217a644021b0cbc911758ff81e3e3a5902f
4
+ data.tar.gz: cac9cc64a9741e37d90b19114dc36f44a7cee8ac
5
+ SHA512:
6
+ metadata.gz: 40aee55eff82441f5093c3c23fa681ec2b2d3016c7f5ce3744139793dfd0769c324e1f6bef28ae29acdd3fbddebfdf6b1ffdc7e941a6b27854b17b22fed4e36d
7
+ data.tar.gz: e8596c262b56057fb3c0542fe8537af139c8bc36724ee72ffb653bd16b419a3817c11fa59203463086491e2acabcf5878e3050648b979c964d41dafc81b4f564
@@ -25,8 +25,14 @@ class Officex2str
25
25
 
26
26
  def convert
27
27
  if valid_file?
28
- extract_xmls
29
- xml_to_str
28
+ text = []
29
+ select_target_entries.each do |entry|
30
+ doc = Nokogiri.XML(entry.get_input_stream.read, nil, 'utf8')
31
+ # XLSXではrPhタグに漢字のフリガナが自動的に挿入されるため除外
32
+ doc.css('rPh').remove
33
+ text << doc.to_str
34
+ end
35
+ text.join(' ')
30
36
  else
31
37
  raise InvalidFileTypeError, "Not recognized file type"
32
38
  end
@@ -50,12 +56,4 @@ private
50
56
  end
51
57
  end
52
58
 
53
- def extract_xmls
54
- select_target_entries.map{|entry| xmls << entry.get_input_stream.read }
55
- end
56
-
57
- def xml_to_str
58
- return '' if xmls.empty?
59
- xmls.inject(""){|result, xml| result << Nokogiri.XML(xml, nil, 'utf8').to_str }
60
- end
61
59
  end
@@ -1,3 +1,3 @@
1
1
  class Officex2str
2
- VERSION = "0.0.9"
2
+ VERSION = "0.1.0"
3
3
  end
@@ -60,6 +60,10 @@ describe Officex2str do
60
60
  subject.should include("STG003")
61
61
  subject.should_not include("sonicgarden")
62
62
  subject.should_not include("sheet")
63
+ # フリガナの自動保存分除去確認
64
+ subject.should_not include('カブシキガイシャ')
65
+ subject.should_not include('フクスウタイオウ')
66
+ subject.should_not include('カイシャ')
63
67
  end
64
68
  end
65
69
 
metadata CHANGED
@@ -1,20 +1,18 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: officex2str
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.9
5
- prerelease:
4
+ version: 0.1.0
6
5
  platform: ruby
7
6
  authors:
8
7
  - interu
9
8
  autorequire:
10
9
  bindir: bin
11
10
  cert_chain: []
12
- date: 2014-07-14 00:00:00.000000000 Z
11
+ date: 2016-03-11 00:00:00.000000000 Z
13
12
  dependencies:
14
13
  - !ruby/object:Gem::Dependency
15
14
  name: rake
16
15
  requirement: !ruby/object:Gem::Requirement
17
- none: false
18
16
  requirements:
19
17
  - - '='
20
18
  - !ruby/object:Gem::Version
@@ -22,7 +20,6 @@ dependencies:
22
20
  type: :development
23
21
  prerelease: false
24
22
  version_requirements: !ruby/object:Gem::Requirement
25
- none: false
26
23
  requirements:
27
24
  - - '='
28
25
  - !ruby/object:Gem::Version
@@ -30,7 +27,6 @@ dependencies:
30
27
  - !ruby/object:Gem::Dependency
31
28
  name: rspec
32
29
  requirement: !ruby/object:Gem::Requirement
33
- none: false
34
30
  requirements:
35
31
  - - '='
36
32
  - !ruby/object:Gem::Version
@@ -38,7 +34,6 @@ dependencies:
38
34
  type: :development
39
35
  prerelease: false
40
36
  version_requirements: !ruby/object:Gem::Requirement
41
- none: false
42
37
  requirements:
43
38
  - - '='
44
39
  - !ruby/object:Gem::Version
@@ -46,49 +41,43 @@ dependencies:
46
41
  - !ruby/object:Gem::Dependency
47
42
  name: nokogiri
48
43
  requirement: !ruby/object:Gem::Requirement
49
- none: false
50
44
  requirements:
51
- - - ! '>='
45
+ - - ">="
52
46
  - !ruby/object:Gem::Version
53
47
  version: 1.4.7
54
48
  type: :runtime
55
49
  prerelease: false
56
50
  version_requirements: !ruby/object:Gem::Requirement
57
- none: false
58
51
  requirements:
59
- - - ! '>='
52
+ - - ">="
60
53
  - !ruby/object:Gem::Version
61
54
  version: 1.4.7
62
55
  - !ruby/object:Gem::Dependency
63
56
  name: rubyzip
64
57
  requirement: !ruby/object:Gem::Requirement
65
- none: false
66
58
  requirements:
67
- - - ! '>='
59
+ - - ">="
68
60
  - !ruby/object:Gem::Version
69
61
  version: '0'
70
62
  type: :runtime
71
63
  prerelease: false
72
64
  version_requirements: !ruby/object:Gem::Requirement
73
- none: false
74
65
  requirements:
75
- - - ! '>='
66
+ - - ">="
76
67
  - !ruby/object:Gem::Version
77
68
  version: '0'
78
69
  - !ruby/object:Gem::Dependency
79
70
  name: mime-types
80
71
  requirement: !ruby/object:Gem::Requirement
81
- none: false
82
72
  requirements:
83
- - - ! '>='
73
+ - - ">="
84
74
  - !ruby/object:Gem::Version
85
75
  version: '0'
86
76
  type: :runtime
87
77
  prerelease: false
88
78
  version_requirements: !ruby/object:Gem::Requirement
89
- none: false
90
79
  requirements:
91
- - - ! '>='
80
+ - - ">="
92
81
  - !ruby/object:Gem::Version
93
82
  version: '0'
94
83
  description: convert office 2010 files to str
@@ -98,7 +87,7 @@ executables: []
98
87
  extensions: []
99
88
  extra_rdoc_files: []
100
89
  files:
101
- - .gitignore
90
+ - ".gitignore"
102
91
  - Gemfile
103
92
  - LICENSE
104
93
  - README.md
@@ -114,33 +103,26 @@ files:
114
103
  - spec/spec_helper.rb
115
104
  homepage: ''
116
105
  licenses: []
106
+ metadata: {}
117
107
  post_install_message:
118
108
  rdoc_options: []
119
109
  require_paths:
120
110
  - lib
121
111
  required_ruby_version: !ruby/object:Gem::Requirement
122
- none: false
123
112
  requirements:
124
- - - ! '>='
113
+ - - ">="
125
114
  - !ruby/object:Gem::Version
126
115
  version: '0'
127
- segments:
128
- - 0
129
- hash: -2505515257273957175
130
116
  required_rubygems_version: !ruby/object:Gem::Requirement
131
- none: false
132
117
  requirements:
133
- - - ! '>='
118
+ - - ">="
134
119
  - !ruby/object:Gem::Version
135
120
  version: '0'
136
- segments:
137
- - 0
138
- hash: -2505515257273957175
139
121
  requirements: []
140
122
  rubyforge_project:
141
- rubygems_version: 1.8.23
123
+ rubygems_version: 2.2.2
142
124
  signing_key:
143
- specification_version: 3
125
+ specification_version: 4
144
126
  summary: convert office 2010 files(docx,xlsx,pptx) to str
145
127
  test_files:
146
128
  - spec/officex2str_spec.rb