cld3 3.5.0 → 3.5.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (50) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +0 -8
  3. data/cld3.gemspec +6 -6
  4. data/ext/cld3/extconf.rb +1 -2
  5. data/ext/cld3/nnet_language_identifier_c.cc +162 -70
  6. data/lib/cld3.rb +14 -102
  7. data/sig/cld3.rbs +2 -0
  8. metadata +15 -77
  9. data/ext/cld3/Makefile +0 -268
  10. data/ext/cld3/base.o +0 -0
  11. data/ext/cld3/embedding_feature_extractor.o +0 -0
  12. data/ext/cld3/embedding_network.o +0 -0
  13. data/ext/cld3/feature_extractor.o +0 -0
  14. data/ext/cld3/feature_types.o +0 -0
  15. data/ext/cld3/fixunicodevalue.o +0 -0
  16. data/ext/cld3/fml_parser.o +0 -0
  17. data/ext/cld3/generated_entities.o +0 -0
  18. data/ext/cld3/generated_ulscript.o +0 -0
  19. data/ext/cld3/getonescriptspan.o +0 -0
  20. data/ext/cld3/lang_id_nn_params.o +0 -0
  21. data/ext/cld3/language_identifier_features.o +0 -0
  22. data/ext/cld3/libcld3.def +0 -8
  23. data/ext/cld3/libcld3.so +0 -0
  24. data/ext/cld3/nnet_language_identifier.o +0 -0
  25. data/ext/cld3/nnet_language_identifier_c.o +0 -0
  26. data/ext/cld3/offsetmap.o +0 -0
  27. data/ext/cld3/registry.o +0 -0
  28. data/ext/cld3/relevant_script_feature.o +0 -0
  29. data/ext/cld3/script_span/fixunicodevalue.h +0 -69
  30. data/ext/cld3/script_span/generated_ulscript.h +0 -142
  31. data/ext/cld3/script_span/getonescriptspan.h +0 -124
  32. data/ext/cld3/script_span/integral_types.h +0 -37
  33. data/ext/cld3/script_span/offsetmap.h +0 -168
  34. data/ext/cld3/script_span/port.h +0 -143
  35. data/ext/cld3/script_span/stringpiece.h +0 -81
  36. data/ext/cld3/script_span/text_processing.h +0 -30
  37. data/ext/cld3/script_span/utf8acceptinterchange.h +0 -486
  38. data/ext/cld3/script_span/utf8prop_lettermarkscriptnum.h +0 -1631
  39. data/ext/cld3/script_span/utf8repl_lettermarklower.h +0 -758
  40. data/ext/cld3/script_span/utf8scannot_lettermarkspecial.h +0 -1455
  41. data/ext/cld3/script_span/utf8statetable.h +0 -285
  42. data/ext/cld3/sentence_features.o +0 -0
  43. data/ext/cld3/task_context.o +0 -0
  44. data/ext/cld3/task_context_params.o +0 -0
  45. data/ext/cld3/text_processing.o +0 -0
  46. data/ext/cld3/unicodetext.o +0 -0
  47. data/ext/cld3/utf8statetable.o +0 -0
  48. data/ext/cld3/utils.o +0 -0
  49. data/ext/cld3/workspace.o +0 -0
  50. data/lib/cld3/unstable.rb +0 -58
metadata CHANGED
@@ -1,95 +1,75 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: cld3
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.5.0
4
+ version: 3.5.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Akihiko Odaki
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2022-07-19 00:00:00.000000000 Z
11
+ date: 2023-02-21 00:00:00.000000000 Z
12
12
  dependencies:
13
- - !ruby/object:Gem::Dependency
14
- name: ffi
15
- requirement: !ruby/object:Gem::Requirement
16
- requirements:
17
- - - ">="
18
- - !ruby/object:Gem::Version
19
- version: 1.1.0
20
- - - "<"
21
- - !ruby/object:Gem::Version
22
- version: 1.16.0
23
- type: :runtime
24
- prerelease: false
25
- version_requirements: !ruby/object:Gem::Requirement
26
- requirements:
27
- - - ">="
28
- - !ruby/object:Gem::Version
29
- version: 1.1.0
30
- - - "<"
31
- - !ruby/object:Gem::Version
32
- version: 1.16.0
33
13
  - !ruby/object:Gem::Dependency
34
14
  name: rbs
35
15
  requirement: !ruby/object:Gem::Requirement
36
16
  requirements:
37
17
  - - ">="
38
18
  - !ruby/object:Gem::Version
39
- version: 2.6.0
19
+ version: 2.8.0
40
20
  - - "<"
41
21
  - !ruby/object:Gem::Version
42
- version: 2.7.0
22
+ version: 2.9.0
43
23
  type: :development
44
24
  prerelease: false
45
25
  version_requirements: !ruby/object:Gem::Requirement
46
26
  requirements:
47
27
  - - ">="
48
28
  - !ruby/object:Gem::Version
49
- version: 2.6.0
29
+ version: 2.8.0
50
30
  - - "<"
51
31
  - !ruby/object:Gem::Version
52
- version: 2.7.0
32
+ version: 2.9.0
53
33
  - !ruby/object:Gem::Dependency
54
34
  name: rspec
55
35
  requirement: !ruby/object:Gem::Requirement
56
36
  requirements:
57
37
  - - ">="
58
38
  - !ruby/object:Gem::Version
59
- version: 3.11.0
39
+ version: 3.12.0
60
40
  - - "<"
61
41
  - !ruby/object:Gem::Version
62
- version: 3.12.0
42
+ version: 3.13.0
63
43
  type: :development
64
44
  prerelease: false
65
45
  version_requirements: !ruby/object:Gem::Requirement
66
46
  requirements:
67
47
  - - ">="
68
48
  - !ruby/object:Gem::Version
69
- version: 3.11.0
49
+ version: 3.12.0
70
50
  - - "<"
71
51
  - !ruby/object:Gem::Version
72
- version: 3.12.0
52
+ version: 3.13.0
73
53
  - !ruby/object:Gem::Dependency
74
54
  name: steep
75
55
  requirement: !ruby/object:Gem::Requirement
76
56
  requirements:
77
57
  - - ">="
78
58
  - !ruby/object:Gem::Version
79
- version: 1.0.0
59
+ version: 1.3.0
80
60
  - - "<"
81
61
  - !ruby/object:Gem::Version
82
- version: 1.1.0
62
+ version: 1.4.0
83
63
  type: :development
84
64
  prerelease: false
85
65
  version_requirements: !ruby/object:Gem::Requirement
86
66
  requirements:
87
67
  - - ">="
88
68
  - !ruby/object:Gem::Version
89
- version: 1.0.0
69
+ version: 1.3.0
90
70
  - - "<"
91
71
  - !ruby/object:Gem::Version
92
- version: 1.1.0
72
+ version: 1.4.0
93
73
  description: Compact Language Detector v3 (CLD3) is a neural network model for language
94
74
  identification.
95
75
  email: akihiko.odaki@gmail.com
@@ -103,113 +83,71 @@ files:
103
83
  - LICENSE_CLD3
104
84
  - README.md
105
85
  - cld3.gemspec
106
- - ext/cld3/Makefile
107
86
  - ext/cld3/base.cc
108
87
  - ext/cld3/base.h
109
- - ext/cld3/base.o
110
88
  - ext/cld3/casts.h
111
89
  - ext/cld3/cld_3/protos/feature_extractor.pb.h
112
90
  - ext/cld3/cld_3/protos/sentence.pb.h
113
91
  - ext/cld3/cld_3/protos/task_spec.pb.h
114
92
  - ext/cld3/embedding_feature_extractor.cc
115
93
  - ext/cld3/embedding_feature_extractor.h
116
- - ext/cld3/embedding_feature_extractor.o
117
94
  - ext/cld3/embedding_network.cc
118
95
  - ext/cld3/embedding_network.h
119
- - ext/cld3/embedding_network.o
120
96
  - ext/cld3/embedding_network_params.h
121
97
  - ext/cld3/extconf.rb
122
98
  - ext/cld3/feature_extractor.cc
123
99
  - ext/cld3/feature_extractor.h
124
- - ext/cld3/feature_extractor.o
125
100
  - ext/cld3/feature_types.cc
126
101
  - ext/cld3/feature_types.h
127
- - ext/cld3/feature_types.o
128
102
  - ext/cld3/fixunicodevalue.cc
129
103
  - ext/cld3/fixunicodevalue.h
130
- - ext/cld3/fixunicodevalue.o
131
104
  - ext/cld3/float16.h
132
105
  - ext/cld3/fml_parser.cc
133
106
  - ext/cld3/fml_parser.h
134
- - ext/cld3/fml_parser.o
135
107
  - ext/cld3/generated_entities.cc
136
- - ext/cld3/generated_entities.o
137
108
  - ext/cld3/generated_ulscript.cc
138
109
  - ext/cld3/generated_ulscript.h
139
- - ext/cld3/generated_ulscript.o
140
110
  - ext/cld3/getonescriptspan.cc
141
111
  - ext/cld3/getonescriptspan.h
142
- - ext/cld3/getonescriptspan.o
143
112
  - ext/cld3/integral_types.h
144
113
  - ext/cld3/lang_id_nn_params.cc
145
114
  - ext/cld3/lang_id_nn_params.h
146
- - ext/cld3/lang_id_nn_params.o
147
115
  - ext/cld3/language_identifier_features.cc
148
116
  - ext/cld3/language_identifier_features.h
149
- - ext/cld3/language_identifier_features.o
150
- - ext/cld3/libcld3.def
151
- - ext/cld3/libcld3.so
152
117
  - ext/cld3/nnet_language_identifier.cc
153
118
  - ext/cld3/nnet_language_identifier.h
154
- - ext/cld3/nnet_language_identifier.o
155
119
  - ext/cld3/nnet_language_identifier_c.cc
156
- - ext/cld3/nnet_language_identifier_c.o
157
120
  - ext/cld3/offsetmap.cc
158
121
  - ext/cld3/offsetmap.h
159
- - ext/cld3/offsetmap.o
160
122
  - ext/cld3/port.h
161
123
  - ext/cld3/registry.cc
162
124
  - ext/cld3/registry.h
163
- - ext/cld3/registry.o
164
125
  - ext/cld3/relevant_script_feature.cc
165
126
  - ext/cld3/relevant_script_feature.h
166
- - ext/cld3/relevant_script_feature.o
167
127
  - ext/cld3/script_detector.h
168
- - ext/cld3/script_span/fixunicodevalue.h
169
- - ext/cld3/script_span/generated_ulscript.h
170
- - ext/cld3/script_span/getonescriptspan.h
171
- - ext/cld3/script_span/integral_types.h
172
- - ext/cld3/script_span/offsetmap.h
173
- - ext/cld3/script_span/port.h
174
- - ext/cld3/script_span/stringpiece.h
175
- - ext/cld3/script_span/text_processing.h
176
- - ext/cld3/script_span/utf8acceptinterchange.h
177
- - ext/cld3/script_span/utf8prop_lettermarkscriptnum.h
178
- - ext/cld3/script_span/utf8repl_lettermarklower.h
179
- - ext/cld3/script_span/utf8scannot_lettermarkspecial.h
180
- - ext/cld3/script_span/utf8statetable.h
181
128
  - ext/cld3/sentence_features.cc
182
129
  - ext/cld3/sentence_features.h
183
- - ext/cld3/sentence_features.o
184
130
  - ext/cld3/simple_adder.h
185
131
  - ext/cld3/stringpiece.h
186
132
  - ext/cld3/task_context.cc
187
133
  - ext/cld3/task_context.h
188
- - ext/cld3/task_context.o
189
134
  - ext/cld3/task_context_params.cc
190
135
  - ext/cld3/task_context_params.h
191
- - ext/cld3/task_context_params.o
192
136
  - ext/cld3/text_processing.cc
193
137
  - ext/cld3/text_processing.h
194
- - ext/cld3/text_processing.o
195
138
  - ext/cld3/unicodetext.cc
196
139
  - ext/cld3/unicodetext.h
197
- - ext/cld3/unicodetext.o
198
140
  - ext/cld3/utf8acceptinterchange.h
199
141
  - ext/cld3/utf8prop_lettermarkscriptnum.h
200
142
  - ext/cld3/utf8repl_lettermarklower.h
201
143
  - ext/cld3/utf8scannot_lettermarkspecial.h
202
144
  - ext/cld3/utf8statetable.cc
203
145
  - ext/cld3/utf8statetable.h
204
- - ext/cld3/utf8statetable.o
205
146
  - ext/cld3/utils.cc
206
147
  - ext/cld3/utils.h
207
- - ext/cld3/utils.o
208
148
  - ext/cld3/workspace.cc
209
149
  - ext/cld3/workspace.h
210
- - ext/cld3/workspace.o
211
150
  - lib/cld3.rb
212
- - lib/cld3/unstable.rb
213
151
  - sig/cld3.rbs
214
152
  homepage: https://github.com/akihikodaki/cld3-ruby
215
153
  licenses:
@@ -233,7 +171,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
233
171
  - !ruby/object:Gem::Version
234
172
  version: '0'
235
173
  requirements: []
236
- rubygems_version: 3.3.7
174
+ rubygems_version: 3.3.25
237
175
  signing_key:
238
176
  specification_version: 4
239
177
  summary: Compact Language Detector v3 (CLD3)
data/ext/cld3/Makefile DELETED
@@ -1,268 +0,0 @@
1
-
2
- SHELL = /bin/sh
3
-
4
- # V=0 quiet, V=1 verbose. other values don't work.
5
- V = 1
6
- V0 = $(V:0=)
7
- Q1 = $(V:1=)
8
- Q = $(Q1:0=@)
9
- ECHO1 = $(V:1=@ :)
10
- ECHO = $(ECHO1:0=@ echo)
11
- NULLCMD = :
12
-
13
- #### Start of system configuration section. ####
14
-
15
- srcdir = .
16
- topdir = /usr/include
17
- hdrdir = $(topdir)
18
- arch_hdrdir = /usr/include
19
- PATH_SEPARATOR = :
20
- VPATH = $(srcdir):$(arch_hdrdir)/ruby:$(hdrdir)/ruby
21
- prefix = $(DESTDIR)/usr
22
- rubysitearchprefix = $(sitearchlibdir)/$(RUBY_BASE_NAME)
23
- rubyarchprefix = $(DESTDIR)/usr/lib64/ruby
24
- rubylibprefix = $(exec_prefix)/share/ruby
25
- exec_prefix = $(DESTDIR)/usr
26
- vendorarchhdrdir = $(vendorhdrdir)/$(arch)
27
- sitearchhdrdir = $(sitehdrdir)/$(arch)
28
- rubyarchhdrdir = $(DESTDIR)/usr/include
29
- vendorhdrdir = $(rubyhdrdir)/vendor_ruby
30
- sitehdrdir = $(rubyhdrdir)/site_ruby
31
- rubyhdrdir = $(DESTDIR)/usr/include
32
- rubygemsdir = $(DESTDIR)/usr/share/rubygems
33
- vendorarchdir = $(DESTDIR)/usr/lib64/ruby/vendor_ruby
34
- vendorlibdir = $(vendordir)
35
- vendordir = $(DESTDIR)/usr/share/ruby/vendor_ruby
36
- sitearchdir = $(DESTDIR)/usr/local/lib64/ruby/site_ruby
37
- sitelibdir = $(sitedir)
38
- sitedir = $(DESTDIR)/usr/local/share/ruby/site_ruby
39
- rubyarchdir = $(rubyarchprefix)
40
- rubylibdir = $(rubylibprefix)
41
- sitearchincludedir = $(includedir)/$(sitearch)
42
- archincludedir = $(includedir)/$(arch)
43
- sitearchlibdir = $(libdir)/$(sitearch)
44
- archlibdir = $(DESTDIR)/usr/lib64
45
- ridir = $(datarootdir)/$(RI_BASE_NAME)
46
- mandir = $(DESTDIR)/usr/share/man
47
- localedir = $(datarootdir)/locale
48
- libdir = $(exec_prefix)/lib64
49
- psdir = $(docdir)
50
- pdfdir = $(docdir)
51
- dvidir = $(docdir)
52
- htmldir = $(docdir)
53
- infodir = $(DESTDIR)/usr/share/info
54
- docdir = $(datarootdir)/doc/$(PACKAGE)
55
- oldincludedir = $(DESTDIR)/usr/include
56
- includedir = $(exec_prefix)/include
57
- runstatedir = $(localstatedir)/run
58
- localstatedir = $(DESTDIR)/var
59
- sharedstatedir = $(DESTDIR)/var/lib
60
- sysconfdir = $(DESTDIR)/etc
61
- datadir = $(DESTDIR)/usr/share
62
- datarootdir = $(prefix)/share
63
- libexecdir = $(DESTDIR)/usr/libexec
64
- sbindir = $(DESTDIR)/usr/sbin
65
- bindir = $(exec_prefix)/bin
66
- archdir = $(rubyarchdir)
67
-
68
-
69
- CC_WRAPPER =
70
- CC = gcc
71
- CXX = g++
72
- LIBRUBY = $(LIBRUBY_SO)
73
- LIBRUBY_A = lib$(RUBY_SO_NAME)-static.a
74
- LIBRUBYARG_SHARED = -l$(RUBY_SO_NAME)
75
- LIBRUBYARG_STATIC = -l$(RUBY_SO_NAME)-static $(MAINLIBS)
76
- empty =
77
- OUTFLAG = -o $(empty)
78
- COUTFLAG = -o $(empty)
79
- CSRCFLAG = $(empty)
80
-
81
- RUBY_EXTCONF_H =
82
- cflags = $(optflags) $(debugflags) $(warnflags)
83
- cxxflags =
84
- optflags = -O3 -fno-fast-math
85
- debugflags = -ggdb3
86
- warnflags = -Wall -Wextra -Wdeprecated-declarations -Wduplicated-cond -Wimplicit-function-declaration -Wimplicit-int -Wmisleading-indentation -Wpointer-arith -Wwrite-strings -Wold-style-definition -Wimplicit-fallthrough=0 -Wmissing-noreturn -Wno-cast-function-type -Wno-constant-logical-operand -Wno-long-long -Wno-missing-field-initializers -Wno-overlength-strings -Wno-packed-bitfield-compat -Wno-parentheses-equality -Wno-self-assign -Wno-tautological-compare -Wno-unused-parameter -Wno-unused-value -Wsuggest-attribute=format -Wsuggest-attribute=noreturn -Wunused-variable -Wundef
87
- cppflags =
88
- CCDLFLAGS = -fPIC
89
- CFLAGS = $(CCDLFLAGS) -O2 -flto=auto -ffat-lto-objects -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-D_FORTIFY_SOURCE=2 -Wp,-D_GLIBCXX_ASSERTIONS -specs=/usr/lib/rpm/redhat/redhat-hardened-cc1 -fstack-protector-strong -specs=/usr/lib/rpm/redhat/redhat-annobin-cc1 -mbranch-protection=standard -fasynchronous-unwind-tables -fstack-clash-protection -fPIC $(ARCH_FLAG)
90
- INCFLAGS = -I. -I$(arch_hdrdir) -I$(hdrdir)/ruby/backward -I$(hdrdir) -I$(srcdir)
91
- DEFS =
92
- CPPFLAGS = $(DEFS) $(cppflags)
93
- CXXFLAGS = $(CCDLFLAGS) -O2 -flto=auto -ffat-lto-objects -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-D_FORTIFY_SOURCE=2 -Wp,-D_GLIBCXX_ASSERTIONS -specs=/usr/lib/rpm/redhat/redhat-hardened-cc1 -fstack-protector-strong -specs=/usr/lib/rpm/redhat/redhat-annobin-cc1 -mbranch-protection=standard -fasynchronous-unwind-tables -fstack-clash-protection -fvisibility=hidden -std=c++17 $(ARCH_FLAG)
94
- ldflags = -L. -Wl,-z,relro -Wl,--as-needed -Wl,-z,now -specs=/usr/lib/rpm/redhat/redhat-hardened-ld -specs=/usr/lib/rpm/redhat/redhat-annobin-cc1 -Wl,--build-id=sha1 -fstack-protector-strong -rdynamic -Wl,-export-dynamic -Wl,--no-as-needed
95
- dldflags = -Wl,-z,relro -Wl,--as-needed -Wl,-z,now -specs=/usr/lib/rpm/redhat/redhat-hardened-ld -specs=/usr/lib/rpm/redhat/redhat-annobin-cc1 -Wl,--build-id=sha1
96
- ARCH_FLAG =
97
- DLDFLAGS = $(ldflags) $(dldflags) $(ARCH_FLAG)
98
- LDSHARED = $(CC) -shared
99
- LDSHAREDXX = $(CXX) -shared
100
- AR = gcc-ar
101
- EXEEXT =
102
-
103
- RUBY_INSTALL_NAME = $(RUBY_BASE_NAME)
104
- RUBY_SO_NAME = ruby
105
- RUBYW_INSTALL_NAME =
106
- RUBY_VERSION_NAME = $(RUBY_BASE_NAME)-$(ruby_version_dir_name)
107
- RUBYW_BASE_NAME = rubyw
108
- RUBY_BASE_NAME = ruby
109
-
110
- arch = aarch64-linux
111
- sitearch = $(arch)
112
- ruby_version = 3.1.0
113
- ruby = $(bindir)/$(RUBY_BASE_NAME)
114
- RUBY = $(ruby)
115
- ruby_headers = $(hdrdir)/ruby.h $(hdrdir)/ruby/backward.h $(hdrdir)/ruby/ruby.h $(hdrdir)/ruby/defines.h $(hdrdir)/ruby/missing.h $(hdrdir)/ruby/intern.h $(hdrdir)/ruby/st.h $(hdrdir)/ruby/subst.h $(arch_hdrdir)/ruby/config.h
116
-
117
- RM = rm -f
118
- RM_RF = rm -fr
119
- RMDIRS = rmdir --ignore-fail-on-non-empty -p
120
- MAKEDIRS = /usr/bin/mkdir -p
121
- INSTALL = /usr/bin/install -c
122
- INSTALL_PROG = $(INSTALL) -m 0755
123
- INSTALL_DATA = $(INSTALL) -m 644
124
- COPY = cp
125
- TOUCH = exit >
126
-
127
- #### End of system configuration section. ####
128
-
129
- preload =
130
- libpath = . $(archlibdir)
131
- LIBPATH = -L. -L$(archlibdir)
132
- DEFFILE =
133
-
134
- CLEANFILES = mkmf.log
135
- DISTCLEANFILES =
136
- DISTCLEANDIRS =
137
-
138
- extout =
139
- extout_prefix =
140
- target_prefix =
141
- LOCAL_LIBS =
142
- LIBS = -lm -lc
143
- ORIG_SRCS = base.cc embedding_feature_extractor.cc embedding_network.cc feature_extractor.cc feature_types.cc fixunicodevalue.cc fml_parser.cc generated_entities.cc generated_ulscript.cc getonescriptspan.cc lang_id_nn_params.cc language_identifier_features.cc nnet_language_identifier.cc nnet_language_identifier_c.cc offsetmap.cc registry.cc relevant_script_feature.cc sentence_features.cc task_context.cc task_context_params.cc text_processing.cc unicodetext.cc utf8statetable.cc utils.cc workspace.cc
144
- SRCS = $(ORIG_SRCS)
145
- OBJS = base.o embedding_feature_extractor.o embedding_network.o feature_extractor.o feature_types.o fixunicodevalue.o fml_parser.o generated_entities.o generated_ulscript.o getonescriptspan.o lang_id_nn_params.o language_identifier_features.o nnet_language_identifier.o nnet_language_identifier_c.o offsetmap.o registry.o relevant_script_feature.o sentence_features.o task_context.o task_context_params.o text_processing.o unicodetext.o utf8statetable.o utils.o workspace.o
146
- HDRS = $(srcdir)/base.h $(srcdir)/casts.h $(srcdir)/embedding_feature_extractor.h $(srcdir)/embedding_network.h $(srcdir)/embedding_network_params.h $(srcdir)/feature_extractor.h $(srcdir)/feature_types.h $(srcdir)/fixunicodevalue.h $(srcdir)/float16.h $(srcdir)/fml_parser.h $(srcdir)/generated_ulscript.h $(srcdir)/getonescriptspan.h $(srcdir)/integral_types.h $(srcdir)/lang_id_nn_params.h $(srcdir)/language_identifier_features.h $(srcdir)/nnet_language_identifier.h $(srcdir)/offsetmap.h $(srcdir)/port.h $(srcdir)/registry.h $(srcdir)/relevant_script_feature.h $(srcdir)/script_detector.h $(srcdir)/sentence_features.h $(srcdir)/simple_adder.h $(srcdir)/stringpiece.h $(srcdir)/task_context.h $(srcdir)/task_context_params.h $(srcdir)/text_processing.h $(srcdir)/unicodetext.h $(srcdir)/utf8acceptinterchange.h $(srcdir)/utf8prop_lettermarkscriptnum.h $(srcdir)/utf8repl_lettermarklower.h $(srcdir)/utf8scannot_lettermarkspecial.h $(srcdir)/utf8statetable.h $(srcdir)/utils.h $(srcdir)/workspace.h
147
- LOCAL_HDRS =
148
- TARGET = libcld3
149
- TARGET_NAME = libcld3
150
- TARGET_ENTRY = Init_$(TARGET_NAME)
151
- DLLIB = $(TARGET).so
152
- EXTSTATIC =
153
- STATIC_LIB =
154
-
155
- TIMESTAMP_DIR = .
156
- BINDIR = $(bindir)
157
- RUBYCOMMONDIR = $(sitedir)$(target_prefix)
158
- RUBYLIBDIR = $(sitelibdir)$(target_prefix)
159
- RUBYARCHDIR = $(sitearchdir)$(target_prefix)
160
- HDRDIR = $(sitehdrdir)$(target_prefix)
161
- ARCHHDRDIR = $(sitearchhdrdir)$(target_prefix)
162
- TARGET_SO_DIR =
163
- TARGET_SO = $(TARGET_SO_DIR)$(DLLIB)
164
- CLEANLIBS = $(TARGET_SO) false
165
- CLEANOBJS = *.o *.bak
166
-
167
- all: $(DLLIB)
168
- static: $(STATIC_LIB)
169
- .PHONY: all install static install-so install-rb
170
- .PHONY: clean clean-so clean-static clean-rb
171
-
172
- clean-static::
173
- clean-rb-default::
174
- clean-rb::
175
- clean-so::
176
- clean: clean-so clean-static clean-rb-default clean-rb
177
- -$(Q)$(RM_RF) $(CLEANLIBS) $(CLEANOBJS) $(CLEANFILES) .*.time
178
-
179
- distclean-rb-default::
180
- distclean-rb::
181
- distclean-so::
182
- distclean-static::
183
- distclean: clean distclean-so distclean-static distclean-rb-default distclean-rb
184
- -$(Q)$(RM) Makefile $(RUBY_EXTCONF_H) conftest.* mkmf.log
185
- -$(Q)$(RM) core ruby$(EXEEXT) *~ $(DISTCLEANFILES)
186
- -$(Q)$(RMDIRS) $(DISTCLEANDIRS) 2> /dev/null || true
187
-
188
- realclean: distclean
189
- install: install-so install-rb
190
-
191
- install-so: $(DLLIB) $(TIMESTAMP_DIR)/.sitearchdir.time
192
- $(INSTALL_PROG) $(DLLIB) $(RUBYARCHDIR)
193
- clean-static::
194
- -$(Q)$(RM) $(STATIC_LIB)
195
- install-rb: pre-install-rb do-install-rb install-rb-default
196
- install-rb-default: pre-install-rb-default do-install-rb-default
197
- pre-install-rb: Makefile
198
- pre-install-rb-default: Makefile
199
- do-install-rb:
200
- do-install-rb-default:
201
- pre-install-rb-default:
202
- @$(NULLCMD)
203
- $(TIMESTAMP_DIR)/.sitearchdir.time:
204
- $(Q) $(MAKEDIRS) $(@D) $(RUBYARCHDIR)
205
- $(Q) $(TOUCH) $@
206
-
207
- site-install: site-install-so site-install-rb
208
- site-install-so: install-so
209
- site-install-rb: install-rb
210
-
211
- .SUFFIXES: .c .m .cc .mm .cxx .cpp .o .S
212
-
213
- .cc.o:
214
- $(ECHO) compiling $(<)
215
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $(CSRCFLAG)$<
216
-
217
- .cc.S:
218
- $(ECHO) translating $(<)
219
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -S $(CSRCFLAG)$<
220
-
221
- .mm.o:
222
- $(ECHO) compiling $(<)
223
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $(CSRCFLAG)$<
224
-
225
- .mm.S:
226
- $(ECHO) translating $(<)
227
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -S $(CSRCFLAG)$<
228
-
229
- .cxx.o:
230
- $(ECHO) compiling $(<)
231
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $(CSRCFLAG)$<
232
-
233
- .cxx.S:
234
- $(ECHO) translating $(<)
235
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -S $(CSRCFLAG)$<
236
-
237
- .cpp.o:
238
- $(ECHO) compiling $(<)
239
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $(CSRCFLAG)$<
240
-
241
- .cpp.S:
242
- $(ECHO) translating $(<)
243
- $(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -S $(CSRCFLAG)$<
244
-
245
- .c.o:
246
- $(ECHO) compiling $(<)
247
- $(Q) $(CC) $(INCFLAGS) $(CPPFLAGS) $(CFLAGS) $(COUTFLAG)$@ -c $(CSRCFLAG)$<
248
-
249
- .c.S:
250
- $(ECHO) translating $(<)
251
- $(Q) $(CC) $(INCFLAGS) $(CPPFLAGS) $(CFLAGS) $(COUTFLAG)$@ -S $(CSRCFLAG)$<
252
-
253
- .m.o:
254
- $(ECHO) compiling $(<)
255
- $(Q) $(CC) $(INCFLAGS) $(CPPFLAGS) $(CFLAGS) $(COUTFLAG)$@ -c $(CSRCFLAG)$<
256
-
257
- .m.S:
258
- $(ECHO) translating $(<)
259
- $(Q) $(CC) $(INCFLAGS) $(CPPFLAGS) $(CFLAGS) $(COUTFLAG)$@ -S $(CSRCFLAG)$<
260
-
261
- $(TARGET_SO): $(OBJS) Makefile
262
- $(ECHO) linking shared-object $(DLLIB)
263
- -$(Q)$(RM) $(@)
264
- $(Q) $(LDSHAREDXX) -o $@ $(OBJS) $(LIBPATH) $(DLDFLAGS) $(LOCAL_LIBS) $(LIBS)
265
-
266
-
267
-
268
- $(OBJS): $(HDRS) $(ruby_headers)
data/ext/cld3/base.o DELETED
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
data/ext/cld3/libcld3.def DELETED
@@ -1,8 +0,0 @@
1
- EXPORTS
2
- NNetLanguageIdentifier_find_language
3
- NNetLanguageIdentifier_find_top_n_most_freq_langs
4
- delete_NNetLanguageIdentifier
5
- delete_result
6
- delete_results
7
- new_NNetLanguageIdentifier
8
- refer_to_nth_result
data/ext/cld3/libcld3.so DELETED
Binary file
Binary file
Binary file
data/ext/cld3/offsetmap.o DELETED
Binary file
data/ext/cld3/registry.o DELETED
Binary file
Binary file
@@ -1,69 +0,0 @@
1
- // Copyright 2013 Google Inc. All Rights Reserved.
2
- //
3
- // Licensed under the Apache License, Version 2.0 (the "License");
4
- // you may not use this file except in compliance with the License.
5
- // You may obtain a copy of the License at
6
- //
7
- // http://www.apache.org/licenses/LICENSE-2.0
8
- //
9
- // Unless required by applicable law or agreed to in writing, software
10
- // distributed under the License is distributed on an "AS IS" BASIS,
11
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
- // See the License for the specific language governing permissions and
13
- // limitations under the License.
14
-
15
- //
16
- // Routine that maps a Unicode code point to an interchange-valid one
17
- //
18
- // Table that maps MS CP1252 bytes 00-FF to their corresponding Unicode
19
- // code points. C0 and C1 control codes that are not interchange-valid
20
- // are mapped to spaces.
21
-
22
-
23
- #ifndef SCRIPT_SPAN_FIXUNICODEVALUE_H_
24
- #define SCRIPT_SPAN_FIXUNICODEVALUE_H_
25
-
26
- #include "integral_types.h" // for char32
27
- #include "port.h"
28
-
29
- namespace chrome_lang_id {
30
- namespace CLD2 {
31
-
32
- // Map byte value 0000-00FF to char32
33
- // Maps C0 control codes (other than CR LF HT FF) to space [29 instances including DEL=0x7F]
34
- // Maps C1 control codes to CP1252 [27 instances] or space [5 instances]
35
- static const char32 kMapFullMicrosoft1252OrSpace[256] = {
36
- 0x20,0x20,0x20,0x20, 0x20,0x20,0x20,0x20, 0x20,0x09,0x0a,0x20, 0x0c,0x0d,0x20,0x20, // 00
37
- 0x20,0x20,0x20,0x20, 0x20,0x20,0x20,0x20, 0x20,0x20,0x20,0x20, 0x20,0x20,0x20,0x20,
38
- 0x20,0x21,0x22,0x23, 0x24,0x25,0x26,0x27, 0x28,0x29,0x2a,0x2b, 0x2c,0x2d,0x2e,0x2f,
39
- 0x30,0x31,0x32,0x33, 0x34,0x35,0x36,0x37, 0x38,0x39,0x3a,0x3b, 0x3c,0x3d,0x3e,0x3f,
40
-
41
- 0x40,0x41,0x42,0x43, 0x44,0x45,0x46,0x47, 0x48,0x49,0x4a,0x4b, 0x4c,0x4d,0x4e,0x4f, // 40
42
- 0x50,0x51,0x52,0x53, 0x54,0x55,0x56,0x57, 0x58,0x59,0x5a,0x5b, 0x5c,0x5d,0x5e,0x5f,
43
- 0x60,0x61,0x62,0x63, 0x64,0x65,0x66,0x67, 0x68,0x69,0x6a,0x6b, 0x6c,0x6d,0x6e,0x6f,
44
- 0x70,0x71,0x72,0x73, 0x74,0x75,0x76,0x77, 0x78,0x79,0x7a,0x7b, 0x7c,0x7d,0x7e,0x20,
45
-
46
- 0x20ac,0x20,0x201a,0x0192, 0x201e,0x2026,0x2020,0x2021, // 80
47
- 0x02c6,0x2030,0x0160,0x2039, 0x0152,0x20,0x017d,0x20,
48
- 0x20,0x2018,0x2019,0x201c, 0x201d,0x2022,0x2013,0x2014,
49
- 0x02dc,0x2122,0x0161,0x203a, 0x0153,0x20,0x017e,0x0178,
50
- 0xa0,0xa1,0xa2,0xa3, 0xa4,0xa5,0xa6,0xa7, 0xa8,0xa9,0xaa,0xab, 0xac,0xad,0xae,0xaf, // A0
51
- 0xb0,0xb1,0xb2,0xb3, 0xb4,0xb5,0xb6,0xb7, 0xb8,0xb9,0xba,0xbb, 0xbc,0xbd,0xbe,0xbf,
52
-
53
- 0xc0,0xc1,0xc2,0xc3, 0xc4,0xc5,0xc6,0xc7, 0xc8,0xc9,0xca,0xcb, 0xcc,0xcd,0xce,0xcf, // C0
54
- 0xd0,0xd1,0xd2,0xd3, 0xd4,0xd5,0xd6,0xd7, 0xd8,0xd9,0xda,0xdb, 0xdc,0xdd,0xde,0xdf,
55
- 0xe0,0xe1,0xe2,0xe3, 0xe4,0xe5,0xe6,0xe7, 0xe8,0xe9,0xea,0xeb, 0xec,0xed,0xee,0xef,
56
- 0xf0,0xf1,0xf2,0xf3, 0xf4,0xf5,0xf6,0xf7, 0xf8,0xf9,0xfa,0xfb, 0xfc,0xfd,0xfe,0xff,
57
- };
58
-
59
- // Guarantees that the resulting output value is interchange valid
60
- // 00-FF; map to spaces or MS CP1252
61
- // D800-DFFF; surrogates
62
- // FDD0-FDEF; non-characters
63
- // xxFFFE-xxFFFF; non-characters
64
- char32 FixUnicodeValue(char32 uv);
65
-
66
- } // End namespace CLD2
67
- } // End namespace chrome_lang_id
68
-
69
- #endif // SCRIPT_SPAN_FIXUNICODEVALUE_H_