ooxml_crypt 0.1.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (264) hide show
  1. checksums.yaml +7 -0
  2. data/Gemfile +4 -0
  3. data/LICENSE.txt +21 -0
  4. data/README.md +58 -0
  5. data/Rakefile +12 -0
  6. data/bin/console +15 -0
  7. data/bin/setup +8 -0
  8. data/ext/ooxml_crypt/extconf.rb +18 -0
  9. data/ext/ooxml_crypt/ooxml_crypt.c +27 -0
  10. data/ext/ooxml_crypt/ooxml_crypt.h +7 -0
  11. data/lib/ooxml_crypt/version.rb +5 -0
  12. data/lib/ooxml_crypt.rb +75 -0
  13. data/vendor/cybozulib/.github/workflows/main.yml +12 -0
  14. data/vendor/cybozulib/.gitignore +5 -0
  15. data/vendor/cybozulib/CMakeLists.txt +6 -0
  16. data/vendor/cybozulib/COPYRIGHT +27 -0
  17. data/vendor/cybozulib/Makefile +26 -0
  18. data/vendor/cybozulib/bin/libeay32.dll +0 -0
  19. data/vendor/cybozulib/bin/libmecab.dll +0 -0
  20. data/vendor/cybozulib/bin/ssleay32.dll +0 -0
  21. data/vendor/cybozulib/common.mk +116 -0
  22. data/vendor/cybozulib/common.props +25 -0
  23. data/vendor/cybozulib/cybozulib.sln +286 -0
  24. data/vendor/cybozulib/debug.props +14 -0
  25. data/vendor/cybozulib/include/cybozu/array.hpp +197 -0
  26. data/vendor/cybozulib/include/cybozu/atoi.hpp +238 -0
  27. data/vendor/cybozulib/include/cybozu/atomic.hpp +146 -0
  28. data/vendor/cybozulib/include/cybozu/base64.hpp +210 -0
  29. data/vendor/cybozulib/include/cybozu/benchmark.hpp +212 -0
  30. data/vendor/cybozulib/include/cybozu/bfd.hpp +105 -0
  31. data/vendor/cybozulib/include/cybozu/bit_operation.hpp +139 -0
  32. data/vendor/cybozulib/include/cybozu/bitvector.hpp +358 -0
  33. data/vendor/cybozulib/include/cybozu/condition_variable.hpp +113 -0
  34. data/vendor/cybozulib/include/cybozu/condition_variable_cs.hpp +74 -0
  35. data/vendor/cybozulib/include/cybozu/config.hpp +392 -0
  36. data/vendor/cybozulib/include/cybozu/critical_section.hpp +60 -0
  37. data/vendor/cybozulib/include/cybozu/crypto.hpp +321 -0
  38. data/vendor/cybozulib/include/cybozu/csucvector.hpp +624 -0
  39. data/vendor/cybozulib/include/cybozu/csv.hpp +294 -0
  40. data/vendor/cybozulib/include/cybozu/data_type.hpp +27 -0
  41. data/vendor/cybozulib/include/cybozu/endian.hpp +224 -0
  42. data/vendor/cybozulib/include/cybozu/env.hpp +63 -0
  43. data/vendor/cybozulib/include/cybozu/event.hpp +122 -0
  44. data/vendor/cybozulib/include/cybozu/exception.hpp +253 -0
  45. data/vendor/cybozulib/include/cybozu/file.hpp +626 -0
  46. data/vendor/cybozulib/include/cybozu/fmindex.hpp +291 -0
  47. data/vendor/cybozulib/include/cybozu/format.hpp +93 -0
  48. data/vendor/cybozulib/include/cybozu/frequency.hpp +264 -0
  49. data/vendor/cybozulib/include/cybozu/hash.hpp +67 -0
  50. data/vendor/cybozulib/include/cybozu/inttype.hpp +174 -0
  51. data/vendor/cybozulib/include/cybozu/itoa.hpp +336 -0
  52. data/vendor/cybozulib/include/cybozu/json.hpp +120 -0
  53. data/vendor/cybozulib/include/cybozu/line_stream.hpp +149 -0
  54. data/vendor/cybozulib/include/cybozu/link_libeay32.hpp +21 -0
  55. data/vendor/cybozulib/include/cybozu/link_mpir.hpp +18 -0
  56. data/vendor/cybozulib/include/cybozu/link_ssleay32.hpp +19 -0
  57. data/vendor/cybozulib/include/cybozu/log.hpp +237 -0
  58. data/vendor/cybozulib/include/cybozu/minixml.hpp +452 -0
  59. data/vendor/cybozulib/include/cybozu/mmap.hpp +143 -0
  60. data/vendor/cybozulib/include/cybozu/mutex.hpp +144 -0
  61. data/vendor/cybozulib/include/cybozu/nlp/mecab.hpp +96 -0
  62. data/vendor/cybozulib/include/cybozu/nlp/plsi.hpp +315 -0
  63. data/vendor/cybozulib/include/cybozu/nlp/random.hpp +74 -0
  64. data/vendor/cybozulib/include/cybozu/nlp/sparse.hpp +529 -0
  65. data/vendor/cybozulib/include/cybozu/nlp/svd.hpp +486 -0
  66. data/vendor/cybozulib/include/cybozu/nlp/tfidf.hpp +226 -0
  67. data/vendor/cybozulib/include/cybozu/nlp/top_score.hpp +75 -0
  68. data/vendor/cybozulib/include/cybozu/option.hpp +743 -0
  69. data/vendor/cybozulib/include/cybozu/parallel.hpp +88 -0
  70. data/vendor/cybozulib/include/cybozu/pcg.hpp +72 -0
  71. data/vendor/cybozulib/include/cybozu/process.hpp +324 -0
  72. data/vendor/cybozulib/include/cybozu/quit_signal_handler.hpp +66 -0
  73. data/vendor/cybozulib/include/cybozu/random_generator.hpp +144 -0
  74. data/vendor/cybozulib/include/cybozu/regex.hpp +463 -0
  75. data/vendor/cybozulib/include/cybozu/select8.hpp +279 -0
  76. data/vendor/cybozulib/include/cybozu/serializer.hpp +363 -0
  77. data/vendor/cybozulib/include/cybozu/sha1.hpp +209 -0
  78. data/vendor/cybozulib/include/cybozu/sha2.hpp +506 -0
  79. data/vendor/cybozulib/include/cybozu/siphash.hpp +105 -0
  80. data/vendor/cybozulib/include/cybozu/socket.hpp +785 -0
  81. data/vendor/cybozulib/include/cybozu/ssl.hpp +203 -0
  82. data/vendor/cybozulib/include/cybozu/stacktrace.hpp +291 -0
  83. data/vendor/cybozulib/include/cybozu/stream.hpp +269 -0
  84. data/vendor/cybozulib/include/cybozu/string.hpp +1746 -0
  85. data/vendor/cybozulib/include/cybozu/string_operation.hpp +365 -0
  86. data/vendor/cybozulib/include/cybozu/sucvector.hpp +378 -0
  87. data/vendor/cybozulib/include/cybozu/test.hpp +373 -0
  88. data/vendor/cybozulib/include/cybozu/thread.hpp +229 -0
  89. data/vendor/cybozulib/include/cybozu/time.hpp +281 -0
  90. data/vendor/cybozulib/include/cybozu/tls.hpp +115 -0
  91. data/vendor/cybozulib/include/cybozu/unordered_map.hpp +13 -0
  92. data/vendor/cybozulib/include/cybozu/unordered_set.hpp +13 -0
  93. data/vendor/cybozulib/include/cybozu/v128.hpp +376 -0
  94. data/vendor/cybozulib/include/cybozu/wavelet_matrix.hpp +345 -0
  95. data/vendor/cybozulib/include/cybozu/xorshift.hpp +189 -0
  96. data/vendor/cybozulib/include/cybozu/zlib.hpp +325 -0
  97. data/vendor/cybozulib/include/sais.hxx +364 -0
  98. data/vendor/cybozulib/misc/make_select8tbl.cpp +26 -0
  99. data/vendor/cybozulib/mk.bat +37 -0
  100. data/vendor/cybozulib/readme.md +29 -0
  101. data/vendor/cybozulib/release.props +12 -0
  102. data/vendor/cybozulib/sample/Makefile +30 -0
  103. data/vendor/cybozulib/sample/csucvector_smpl.cpp +42 -0
  104. data/vendor/cybozulib/sample/data/svd/org/test1.S +4 -0
  105. data/vendor/cybozulib/sample/data/svd/org/test1.U +4 -0
  106. data/vendor/cybozulib/sample/data/svd/org/test1.V +6 -0
  107. data/vendor/cybozulib/sample/data/svd/test1 +4 -0
  108. data/vendor/cybozulib/sample/data/svd/test2 +4 -0
  109. data/vendor/cybozulib/sample/desymbol.cpp +127 -0
  110. data/vendor/cybozulib/sample/exception_smpl.cpp +46 -0
  111. data/vendor/cybozulib/sample/fmindex_smpl.cpp +231 -0
  112. data/vendor/cybozulib/sample/log_smpl.cpp +19 -0
  113. data/vendor/cybozulib/sample/mecab_smpl.cpp +37 -0
  114. data/vendor/cybozulib/sample/option2_smpl.cpp +68 -0
  115. data/vendor/cybozulib/sample/option_smpl.cpp +42 -0
  116. data/vendor/cybozulib/sample/plsi_smpl.cpp +207 -0
  117. data/vendor/cybozulib/sample/proj/exception_smpl.vcproj +184 -0
  118. data/vendor/cybozulib/sample/proj/mecab_smpl.vcproj +184 -0
  119. data/vendor/cybozulib/sample/proj/ssl_smpl/ssl_smpl.vcxproj +85 -0
  120. data/vendor/cybozulib/sample/proj/ssl_smpl.vcproj +347 -0
  121. data/vendor/cybozulib/sample/proj/stacktrace_smpl/stacktrace_smpl.vcxproj +85 -0
  122. data/vendor/cybozulib/sample/proj/svd_smpl.vcproj +184 -0
  123. data/vendor/cybozulib/sample/quit_signal_handler.cpp +30 -0
  124. data/vendor/cybozulib/sample/serializer_smpl.cpp +196 -0
  125. data/vendor/cybozulib/sample/socket_smpl.cpp +82 -0
  126. data/vendor/cybozulib/sample/ssl_smpl.cpp +39 -0
  127. data/vendor/cybozulib/sample/stacktrace_smpl.cpp +52 -0
  128. data/vendor/cybozulib/sample/svd_bench_smpl.cpp +143 -0
  129. data/vendor/cybozulib/sample/svd_smpl.cpp +94 -0
  130. data/vendor/cybozulib/sample/wm_bench_smpl.cpp +182 -0
  131. data/vendor/cybozulib/sample/zlib_smpl.cpp +41 -0
  132. data/vendor/cybozulib/src/Makefile +8 -0
  133. data/vendor/cybozulib/src/base/Makefile +19 -0
  134. data/vendor/cybozulib/test/Makefile +12 -0
  135. data/vendor/cybozulib/test/base/Makefile +37 -0
  136. data/vendor/cybozulib/test/base/array_test.cpp +173 -0
  137. data/vendor/cybozulib/test/base/atoi_test.cpp +774 -0
  138. data/vendor/cybozulib/test/base/atomic_test.cpp +49 -0
  139. data/vendor/cybozulib/test/base/base64_test.cpp +113 -0
  140. data/vendor/cybozulib/test/base/bit_operation_test.cpp +134 -0
  141. data/vendor/cybozulib/test/base/bitvector_test.cpp +204 -0
  142. data/vendor/cybozulib/test/base/condition_variable_cs_test.cpp +92 -0
  143. data/vendor/cybozulib/test/base/condition_variable_test.cpp +88 -0
  144. data/vendor/cybozulib/test/base/config_test.cpp +236 -0
  145. data/vendor/cybozulib/test/base/crypto_test.cpp +122 -0
  146. data/vendor/cybozulib/test/base/csucvector_test.cpp +63 -0
  147. data/vendor/cybozulib/test/base/csv_test.cpp +182 -0
  148. data/vendor/cybozulib/test/base/data/a.xml +26 -0
  149. data/vendor/cybozulib/test/base/endian_test.cpp +56 -0
  150. data/vendor/cybozulib/test/base/env_test.cpp +22 -0
  151. data/vendor/cybozulib/test/base/event_test.cpp +41 -0
  152. data/vendor/cybozulib/test/base/file_test.cpp +233 -0
  153. data/vendor/cybozulib/test/base/fmindex_test.cpp +118 -0
  154. data/vendor/cybozulib/test/base/format_test.cpp +12 -0
  155. data/vendor/cybozulib/test/base/frequency_test.cpp +104 -0
  156. data/vendor/cybozulib/test/base/itoa_test.cpp +522 -0
  157. data/vendor/cybozulib/test/base/line_stream_test.cpp +208 -0
  158. data/vendor/cybozulib/test/base/mecab_test.cpp +41 -0
  159. data/vendor/cybozulib/test/base/minixml_test.cpp +103 -0
  160. data/vendor/cybozulib/test/base/mmap_test.cpp +15 -0
  161. data/vendor/cybozulib/test/base/option_test.cpp +487 -0
  162. data/vendor/cybozulib/test/base/parallel_test.cpp +48 -0
  163. data/vendor/cybozulib/test/base/proj/array_test/array_test.vcxproj +86 -0
  164. data/vendor/cybozulib/test/base/proj/atoi_test/atoi_test.vcxproj +86 -0
  165. data/vendor/cybozulib/test/base/proj/atomic_test/atomic_test.vcxproj +86 -0
  166. data/vendor/cybozulib/test/base/proj/base64_test/base64_test.vcxproj +86 -0
  167. data/vendor/cybozulib/test/base/proj/condition_variable_cs_test/condition_variable_cs_test.vcxproj +86 -0
  168. data/vendor/cybozulib/test/base/proj/condition_variable_test/condition_variable_test.vcxproj +86 -0
  169. data/vendor/cybozulib/test/base/proj/config_test/config_test.vcxproj +86 -0
  170. data/vendor/cybozulib/test/base/proj/csv_test/csv_test.vcxproj +86 -0
  171. data/vendor/cybozulib/test/base/proj/endian_test/endian_test.vcxproj +86 -0
  172. data/vendor/cybozulib/test/base/proj/env_test/env_test.vcxproj +86 -0
  173. data/vendor/cybozulib/test/base/proj/event_test/event_test.vcxproj +86 -0
  174. data/vendor/cybozulib/test/base/proj/file_test/file_test.vcxproj +86 -0
  175. data/vendor/cybozulib/test/base/proj/itoa_test/itoa_test.vcxproj +86 -0
  176. data/vendor/cybozulib/test/base/proj/mecab_test/mecab_test.vcxproj +88 -0
  177. data/vendor/cybozulib/test/base/proj/minixml_test/minixml_test.vcxproj +86 -0
  178. data/vendor/cybozulib/test/base/proj/mmap_test/mmap_test.vcxproj +86 -0
  179. data/vendor/cybozulib/test/base/proj/serializer_test/serializer_test.vcxproj +86 -0
  180. data/vendor/cybozulib/test/base/proj/sha1_test/sha1_test.vcxproj +86 -0
  181. data/vendor/cybozulib/test/base/proj/stream_test/stream_test.vcxproj +86 -0
  182. data/vendor/cybozulib/test/base/proj/string_operation_test/string_operation_test.vcxproj +86 -0
  183. data/vendor/cybozulib/test/base/proj/string_test/string_test.vcxproj +86 -0
  184. data/vendor/cybozulib/test/base/proj/thread_test/thread_test.vcxproj +86 -0
  185. data/vendor/cybozulib/test/base/proj/time_test/time_test.vcxproj +86 -0
  186. data/vendor/cybozulib/test/base/proj/tls_test/tls_test.vcxproj +86 -0
  187. data/vendor/cybozulib/test/base/proj/zlib_test/zlib_test.vcxproj +86 -0
  188. data/vendor/cybozulib/test/base/random_generator_test.cpp +28 -0
  189. data/vendor/cybozulib/test/base/regex_test.cpp +74 -0
  190. data/vendor/cybozulib/test/base/serializer_test.cpp +483 -0
  191. data/vendor/cybozulib/test/base/sha1_test.cpp +61 -0
  192. data/vendor/cybozulib/test/base/sha2_test.cpp +191 -0
  193. data/vendor/cybozulib/test/base/siphash_test.cpp +33 -0
  194. data/vendor/cybozulib/test/base/socket_test.cpp +76 -0
  195. data/vendor/cybozulib/test/base/stream_test.cpp +101 -0
  196. data/vendor/cybozulib/test/base/string_operation_test.cpp +340 -0
  197. data/vendor/cybozulib/test/base/string_test.cpp +1705 -0
  198. data/vendor/cybozulib/test/base/sucvector_test.cpp +312 -0
  199. data/vendor/cybozulib/test/base/thread_test.cpp +62 -0
  200. data/vendor/cybozulib/test/base/time_test.cpp +164 -0
  201. data/vendor/cybozulib/test/base/tls_test.cpp +50 -0
  202. data/vendor/cybozulib/test/base/wavelet_matrix_test.cpp +145 -0
  203. data/vendor/cybozulib/test/base/zlib_test.cpp +371 -0
  204. data/vendor/cybozulib/test/nlp/Makefile +27 -0
  205. data/vendor/cybozulib/test/nlp/proj/random_test.vcproj +184 -0
  206. data/vendor/cybozulib/test/nlp/proj/sparse_test.vcproj +184 -0
  207. data/vendor/cybozulib/test/nlp/proj/svd_test.vcproj +184 -0
  208. data/vendor/cybozulib/test/nlp/random_test.cpp +62 -0
  209. data/vendor/cybozulib/test/nlp/sparse_test.cpp +347 -0
  210. data/vendor/cybozulib/test/nlp/svd_test.cpp +234 -0
  211. data/vendor/cybozulib/test/nlp/top_score_test.cpp +40 -0
  212. data/vendor/cybozulib/tool/create_vcproj.py +186 -0
  213. data/vendor/cybozulib/tool/vcproj_tmpl.py +185 -0
  214. data/vendor/msoffice/COPYRIGHT +27 -0
  215. data/vendor/msoffice/Makefile +29 -0
  216. data/vendor/msoffice/bin/64/msoc.dll +0 -0
  217. data/vendor/msoffice/bin/64/msocsample.exe +0 -0
  218. data/vendor/msoffice/bin/64/msoffice-crypt.exe +0 -0
  219. data/vendor/msoffice/bin/msoc.dll +0 -0
  220. data/vendor/msoffice/bin/msocsample.exe +0 -0
  221. data/vendor/msoffice/bin/msoffice-crypt.exe +0 -0
  222. data/vendor/msoffice/common.mk +71 -0
  223. data/vendor/msoffice/common.props +26 -0
  224. data/vendor/msoffice/debug.props +14 -0
  225. data/vendor/msoffice/include/attack.hpp +211 -0
  226. data/vendor/msoffice/include/cfb.hpp +777 -0
  227. data/vendor/msoffice/include/crypto_util.hpp +450 -0
  228. data/vendor/msoffice/include/custom_sha1.hpp +342 -0
  229. data/vendor/msoffice/include/decode.hpp +240 -0
  230. data/vendor/msoffice/include/encode.hpp +221 -0
  231. data/vendor/msoffice/include/make_dataspace.hpp +316 -0
  232. data/vendor/msoffice/include/msoc.h +129 -0
  233. data/vendor/msoffice/include/resource.hpp +7 -0
  234. data/vendor/msoffice/include/standard_encryption.hpp +145 -0
  235. data/vendor/msoffice/include/uint32vec.hpp +179 -0
  236. data/vendor/msoffice/include/util.hpp +212 -0
  237. data/vendor/msoffice/lib/.emptydir +0 -0
  238. data/vendor/msoffice/misc/decrypt-xls.vbs +46 -0
  239. data/vendor/msoffice/mk.bat +1 -0
  240. data/vendor/msoffice/mkdll.bat +3 -0
  241. data/vendor/msoffice/msoc.def +13 -0
  242. data/vendor/msoffice/msocsample.py +178 -0
  243. data/vendor/msoffice/msoffice12.sln +31 -0
  244. data/vendor/msoffice/readme.md +110 -0
  245. data/vendor/msoffice/release.props +28 -0
  246. data/vendor/msoffice/src/Makefile +19 -0
  247. data/vendor/msoffice/src/attack.cpp +124 -0
  248. data/vendor/msoffice/src/cfb_test.cpp +77 -0
  249. data/vendor/msoffice/src/minisample.c +54 -0
  250. data/vendor/msoffice/src/msocdll.cpp +276 -0
  251. data/vendor/msoffice/src/msocsample.c +136 -0
  252. data/vendor/msoffice/src/msoffice-crypt.cpp +219 -0
  253. data/vendor/msoffice/src/proj/attack/attack.vcxproj +88 -0
  254. data/vendor/msoffice/src/proj/main/msoffice-crypt.vcxproj +88 -0
  255. data/vendor/msoffice/src/sha1.cpp +234 -0
  256. data/vendor/msoffice/test/Makefile +20 -0
  257. data/vendor/msoffice/test/cfb_test.cpp +74 -0
  258. data/vendor/msoffice/test/hash_test.cpp +59 -0
  259. data/vendor/msoffice/test/proj/cfb/cfb_test.vcxproj +90 -0
  260. data/vendor/msoffice/test/proj/hash/hash_test.vcxproj +90 -0
  261. data/vendor/msoffice/test/sampl.bat +8 -0
  262. data/vendor/msoffice/test_all.py +46 -0
  263. data/vendor/update +4 -0
  264. metadata +351 -0
@@ -0,0 +1,182 @@
1
+ #include <cybozu/wavelet_matrix.hpp>
2
+ #include <cybozu/xorshift.hpp>
3
+ #include <algorithm>
4
+ #include <cybozu/benchmark.hpp>
5
+ #include <stdlib.h>
6
+
7
+ struct Naive {
8
+ private:
9
+ Naive(const Naive&);
10
+ void operator=(const Naive&);
11
+ public:
12
+ const std::vector<uint8_t>& v_;
13
+ explicit Naive(const std::vector<uint8_t>& v)
14
+ : v_(v)
15
+ {
16
+ }
17
+ size_t get(size_t pos) const
18
+ {
19
+ return v_[pos];
20
+ }
21
+ size_t rank(uint32_t val, size_t pos) const
22
+ {
23
+ return std::count(v_.begin(), v_.begin() + pos, val);
24
+ }
25
+ size_t rankLt(uint32_t val, size_t pos) const
26
+ {
27
+ size_t ret = 0;
28
+ for (size_t i = 0, n = pos; i < n; i++) {
29
+ if (v_[i] < val) ret++;
30
+ }
31
+ return ret;
32
+ }
33
+ size_t select(uint32_t val, size_t n) const
34
+ {
35
+ const size_t N = v_.size();
36
+ n++;
37
+ for (size_t i = 0; i < N; i++) {
38
+ if (v_[i] == val) n--;
39
+ if (n == 0) return i;
40
+ }
41
+ return cybozu::NotFound;
42
+ }
43
+ };
44
+
45
/*
	accumulate x into ret
	passed to CYBOZU_BENCH as the function that consumes each benchmarked result
*/
void add(size_t& ret, size_t x)
{
	ret = ret + x;
}
49
+
50
+ template<class T, class RG>
51
+ void bench_get(const T& wm, RG& rg, size_t N)
52
+ {
53
+ size_t ret = 0;
54
+ printf("get ");
55
+ CYBOZU_BENCH("", add, ret, wm.get(rg() & (N - 1)));
56
+ printf(" ret=%u\n", (int)ret);
57
+ }
58
+
59
+ template<class T, class RG>
60
+ void bench_rank(const T& wm, RG& rg, size_t N)
61
+ {
62
+ size_t ret = 0;
63
+ printf("rank ");
64
+ CYBOZU_BENCH("", add, ret, wm.rank(uint8_t(rg()), rg() & (N - 1)));
65
+ printf(" ret=%u\n", (int)ret);
66
+ }
67
+
68
+ template<class T, class RG>
69
+ void bench_rankLt(const T& wm, RG& rg, size_t N)
70
+ {
71
+ size_t ret = 0;
72
+ printf("rank ");
73
+ CYBOZU_BENCH("", add, ret, wm.rankLt(uint8_t(rg()), rg() & (N - 1)));
74
+ printf(" ret=%u\n", (int)ret);
75
+ }
76
+
77
/*
	one iteration of the select benchmark
	@param ret [inout] running sum of the select results
	@param wm [in] object providing select(val, n)
	@param rg [in] random generator called as rg(); it is called twice,
	          first for the value and then for the occurrence index
	@param maxTbl [in] table indexed by byte value; each entry is used as a modulus,
	              so it needs 256 entries and none of them may be zero
*/
template<class T, class RG>
void oneSelect(size_t& ret, const T& wm, RG& rg, const std::vector<int>& maxTbl)
{
	const uint8_t symbol = uint8_t(rg());
	const size_t nth = rg() % maxTbl[symbol];
	ret += wm.select(symbol, nth);
}
84
+
85
+ template<class T, class Vec8, class RG>
86
+ void bench_select(const T& wm, const Vec8& v, RG& rg)
87
+ {
88
+ size_t ret = 0;
89
+ std::vector<int> maxTbl;
90
+ maxTbl.resize(256);
91
+ for (int i = 0; i < 256; i++) {
92
+ maxTbl[i] = (int)wm.size(i) + 1;
93
+ }
94
+ printf("select");
95
+ CYBOZU_BENCH("", oneSelect, ret, wm, rg, maxTbl);
96
+ printf(" ret=%u\n", (int)ret);
97
+ Naive nv(v);
98
+ /*
99
+ over pos=67108805, i=1024, v=58
100
+ over pos=67108841, i=1026, v=35
101
+ */
102
+ const struct {
103
+ uint8_t v;
104
+ uint64_t pos;
105
+ } tbl[] = {
106
+ { 58, 1024 },
107
+ { 35, 1026 },
108
+ };
109
+ for (size_t i = 0; i < CYBOZU_NUM_OF_ARRAY(tbl); i++) {
110
+ uint8_t c = tbl[i].v;
111
+ uint64_t pos = tbl[i].pos;
112
+ uint64_t a = nv.select(c, pos);
113
+ uint64_t b = wm.select(c, pos);
114
+ if (a != b) {
115
+ printf("ERR c=%d, pos=%d, a=%d, b=%d\n", (int)c, (int)pos, (int)a, (int)b);
116
+ exit(1);
117
+ }
118
+ }
119
+ puts("select ok");
120
+ }
121
+
122
+ template<class Vec8>
123
+ void bench(const cybozu::WaveletMatrix& wm, const Vec8& v, size_t N)
124
+ {
125
+ cybozu::XorShift rg;
126
+ puts("wm");
127
+ bench_get(wm, rg, N);
128
+ bench_rank(wm, rg, N);
129
+ bench_rankLt(wm, rg, N);
130
+ bench_select(wm, v, rg);
131
+ #if 0
132
+ bench_get(nv, "nv", 1000000, N);
133
+ bench_rank(nv, "nv", 10, N);
134
+ bench_rank_lt(nv, "nv", 10, N);
135
+ bench_select(nv, "nv", 10);
136
+ #endif
137
+ }
138
+
139
+ void run(size_t bitLen)
140
+ {
141
+ cybozu::XorShift rg;
142
+ cybozu::WaveletMatrix wm;
143
+ const size_t N = size_t(1) << bitLen;
144
+ printf("%09llx\n", (long long)N);
145
+ puts("init");
146
+ std::vector<uint8_t> v;
147
+ v.resize(N);
148
+ for (size_t i = 0; i < N; i++) {
149
+ v[i] = uint8_t(rg());
150
+ }
151
+ #if 0
152
+ printf("v\n");
153
+ for (size_t i = 0; i < N; i++) {
154
+ printf("%d ", v[i]);
155
+ }
156
+ printf("\n");
157
+ #endif
158
+ wm.init(v, 8);
159
+ puts("start");
160
+ bench(wm, v, N);
161
+ }
162
+
163
+ int main(int argc, char *argv[])
164
+ try
165
+ {
166
+ size_t bitLen = 26;
167
+ argc--, argv++;
168
+ while (argc > 0) {
169
+ if (argc > 1 && strcmp(*argv, "-b") == 0) {
170
+ argc--, argv++;
171
+ bitLen = atoi(*argv);
172
+ } else
173
+ {
174
+ printf("usage wm_bench_smpl.exe [-b bitLen]\n");
175
+ return 1;
176
+ }
177
+ argc--, argv++;
178
+ }
179
+ run(bitLen);
180
+ } catch (std::exception& e) {
181
+ printf("err %s\n", e.what());
182
+ }
@@ -0,0 +1,41 @@
1
+ #include <cybozu/zlib.hpp>
2
+ #include <cybozu/option.hpp>
3
+ #include <cybozu/mmap.hpp>
4
+ #include <fstream>
5
+
6
+ int main(int argc, char *argv[])
7
+ try
8
+ {
9
+ bool doUncomp = false;
10
+ std::string inFile;
11
+ std::string outFile;
12
+ cybozu::Option opt;
13
+ opt.appendBoolOpt(&doUncomp, "d", ": uncompress");
14
+ opt.appendParam(&inFile, "input file");
15
+ opt.appendParam(&outFile, "output file");
16
+ opt.appendHelp("h", ": show thismessage");
17
+ if (!opt.parse(argc, argv)) {
18
+ opt.usage();
19
+ return 0;
20
+ }
21
+ cybozu::Mmap f(inFile);
22
+ std::string out;
23
+ if (doUncomp) {
24
+ out.resize(f.size() * 10);
25
+ size_t size = cybozu::ZlibUncompress(&out[0], out.size(), f.get(), f.size());
26
+ out.resize(size);
27
+ } else {
28
+ out.resize(f.size());
29
+ size_t size = cybozu::ZlibCompress(&out[0], out.size(), f.get(), f.size());
30
+ if (size == 0) {
31
+ fprintf(stderr, "not compress\n");
32
+ return 1;
33
+ }
34
+ out.resize(size);
35
+ }
36
+ std::ofstream ofs(outFile.c_str(), std::ios::binary);
37
+ ofs.write(out.data(), out.size());
38
+ } catch (std::exception& e) {
39
+ fprintf(stderr, "ERR %s\n", e.what());
40
+ return 1;
41
+ }
@@ -0,0 +1,8 @@
1
+
2
+ all:
3
+ $(MAKE) -C base
4
+
5
+ clean:
6
+ $(MAKE) -C base clean
7
+
8
+
@@ -0,0 +1,19 @@
1
+ include ../../common.mk
2
+
3
+ #TARGET=../../lib/libcybozu_base$(OBJSUF).a
4
+ TARGET=
5
+ SRC=
6
+
7
+ all: $(TARGET)
8
+
9
+ $(TARGET): $(OBJS)
10
+ $(AR) $@ $(OBJS)
11
+
12
+ $(OBJDIR):
13
+ @$(MKDIR) $(OBJDIR)
14
+
15
+ clean:
16
+ $(CLEAN)
17
+
18
+ -include $(DEPEND_FILE)
19
+
@@ -0,0 +1,12 @@
1
+
2
+ all:
3
+ $(MAKE) -C base
4
+ $(MAKE) -C nlp
5
+
6
+ test:
7
+ $(MAKE) -C base test
8
+ $(MAKE) -C nlp test
9
+ clean:
10
+ $(MAKE) -C base clean
11
+ $(MAKE) -C nlp clean
12
+
@@ -0,0 +1,37 @@
1
+ include ../../common.mk
2
+
3
+ TARGET=$(TEST_FILE)
4
+ #LIBS=$(TOPDIR)lib/libcybozu_base$(OBJSUF).a
5
+ LIBS=
6
+
7
+ SRC=$(wildcard *.cpp)
8
+ ifneq ($(HAS_BOOST),1)
9
+ SRC:=$(filter-out regex_test.cpp,$(SRC))
10
+ endif
11
+ #ifneq ($(HAS_MECAB),1)
12
+ SRC:=$(filter-out mecab_test.cpp,$(SRC))
13
+ #endif
14
+ ifeq ($(TRAVIS_TEST),1)
15
+ SRC:=$(filter-out env_test.cpp,$(SRC))
16
+ SRC:=$(filter-out fmindex_test.cpp,$(SRC))
17
+ SRC:=$(filter-out mmap_test.cpp,$(SRC))
18
+ SRC:=$(filter-out minixml_test.cpp,$(SRC))
19
+ SRC:=$(filter-out zlib_test.cpp,$(SRC))
20
+ endif
21
+
22
+ all: $(TARGET)
23
+
24
+ test: $(TARGET)
25
+ @$(UNIT_TEST)
26
+
27
+ $(OBJDIR):
28
+ @$(MKDIR) $(OBJDIR)
29
+
30
+ clean:
31
+ $(CLEAN)
32
+
33
+ $(LIBS):
34
+ $(MAKE) -C ../../src
35
+
36
+ -include $(DEPEND_FILE)
37
+
@@ -0,0 +1,173 @@
1
+ /*
2
+ debug for AlignedAlloc with doClear = false
3
+ */
4
+ #include <cybozu/array.hpp>
5
+ #include <cybozu/test.hpp>
6
+
7
+ int a_count = 0;
8
+ int b_count = 0;
9
+
10
+ struct A {
11
+ int n;
12
+ A()
13
+ : n(a_count)
14
+ {
15
+ a_count++;
16
+ }
17
+ ~A()
18
+ {
19
+ a_count--;
20
+ }
21
+ };
22
+
23
+ struct B {
24
+ std::string x;
25
+ B()
26
+ {
27
+ if (b_count == 3) throw std::bad_exception();
28
+ b_count++;
29
+ x = "dummy";
30
+ }
31
+ ~B()
32
+ {
33
+ b_count--;
34
+ }
35
+ };
36
+
37
+ CYBOZU_TEST_AUTO(scoped_array)
38
+ {
39
+ {
40
+ cybozu::ScopedArray<A> a(10);
41
+ CYBOZU_TEST_EQUAL(a_count, 10);
42
+ for (int i = 0; i < 10; i++) {
43
+ CYBOZU_TEST_EQUAL(a[i].n, i);
44
+ CYBOZU_TEST_EQUAL(a.data()[i].n, i);
45
+ }
46
+ }
47
+ CYBOZU_TEST_EQUAL(a_count, 0);
48
+ }
49
+
50
/*
	check whether the address p has none of the bits of (alignSize - 1) set
	@param p [in] address to test
	@param alignSize [in] alignment in bytes; it is used as a bit mask,
	                 so the result is meaningful for powers of two
	@return true if p is aligned to alignSize
*/
bool isAligned(const void *p, size_t alignSize)
{
	const size_t mask = alignSize - 1;
	const uintptr_t addr = uintptr_t(p);
	return (addr & mask) == 0;
}
54
+
55
+ CYBOZU_TEST_AUTO(aligned_array)
56
+ {
57
+ cybozu::AlignedArray<int> a(10);
58
+ CYBOZU_TEST_EQUAL(a.size(), 10);
59
+ CYBOZU_TEST_ASSERT(isAligned(&a[0], 16));
60
+ for (int i = 0; i < 10; i++) {
61
+ CYBOZU_TEST_EQUAL(a[i], 0);
62
+ CYBOZU_TEST_EQUAL(a.data()[i], 0);
63
+ }
64
+ }
65
+
66
+ CYBOZU_TEST_AUTO(aligned_array_char)
67
+ {
68
+ cybozu::AlignedArray<char> a(51);
69
+ CYBOZU_TEST_ASSERT(isAligned(&a[0], 16));
70
+ for (size_t i = 0; i < a.size(); i++) {
71
+ CYBOZU_TEST_EQUAL(a[i], 0);
72
+ }
73
+ }
74
+
75
+ CYBOZU_TEST_AUTO(resize)
76
+ {
77
+ cybozu::AlignedArray<char> a(10);
78
+ CYBOZU_TEST_EQUAL(a.size(), 10);
79
+ CYBOZU_TEST_ASSERT(isAligned(&a[0], 16));
80
+ for (size_t i = 0; i < 10; i++) {
81
+ a[i] = (char)i;
82
+ }
83
+ a.resize(20);
84
+ CYBOZU_TEST_EQUAL(a.size(), 20);
85
+ CYBOZU_TEST_ASSERT(isAligned(&a[0], 16));
86
+ for (size_t i = 0; i < 10; i++) {
87
+ CYBOZU_TEST_EQUAL(a[i], (char)i);
88
+ }
89
+ for (size_t i = 10; i < 20; i++) {
90
+ CYBOZU_TEST_EQUAL(a[i], (char)0);
91
+ }
92
+ const char *p = &a[0];
93
+ a.resize(4);
94
+ CYBOZU_TEST_EQUAL(a.size(), 4);
95
+ CYBOZU_TEST_EQUAL(&a[0], p);
96
+ for (size_t i = 0; i < 4; i++) {
97
+ CYBOZU_TEST_EQUAL(a[i], (char)i);
98
+ }
99
+ CYBOZU_TEST_ASSERT(!a.empty());
100
+ a.resize(0);
101
+ CYBOZU_TEST_EQUAL(a.size(), 0);
102
+ CYBOZU_TEST_ASSERT(a.empty());
103
+ a.resize(20);
104
+ CYBOZU_TEST_EQUAL(a.size(), 20);
105
+ CYBOZU_TEST_EQUAL(&a[0], p); // same pointer until resize(20)
106
+ a.resize(21);
107
+ CYBOZU_TEST_EQUAL(a.size(), 21);
108
+ CYBOZU_TEST_ASSERT(&a[0] != p); // different pointer
109
+ }
110
+
111
+ CYBOZU_TEST_AUTO(AlignedArray_copy)
112
+ {
113
+ cybozu::AlignedArray<int> x, z, y;
114
+ x.resize(10);
115
+ for (size_t i = 0; i < x.size(); i++) x[i] = (int)i;
116
+ y.resize(5);
117
+
118
+ y = x;
119
+ z = x;
120
+ cybozu::AlignedArray<int> w(x);
121
+ CYBOZU_TEST_EQUAL_ARRAY(x.data(), y.data(), x.size());
122
+ CYBOZU_TEST_EQUAL_ARRAY(x.data(), z.data(), x.size());
123
+ CYBOZU_TEST_EQUAL_ARRAY(x.data(), w.data(), x.size());
124
+
125
+ w.resize(25);
126
+ for (size_t i = 0; i < w.size(); i++) w[i] = (int)i + 123;
127
+ w = x;
128
+ CYBOZU_TEST_EQUAL_ARRAY(x.data(), w.data(), x.size());
129
+ }
130
+
131
+ #if (CYBOZU_CPP_VERSION == CYBOZU_CPP_VERSION_CPP11)
132
+ CYBOZU_TEST_AUTO(AlignedArray_move)
133
+ {
134
+ cybozu::AlignedArray<long> x, y;
135
+ x.resize(10);
136
+ y.resize(5);
137
+ const long* px = x.data();
138
+ const long* py = y.data();
139
+ CYBOZU_TEST_EQUAL(x.size(), 10);
140
+ CYBOZU_TEST_EQUAL(y.size(), 5);
141
+ for (size_t i = 0; i < x.size(); i++) {
142
+ x[i] = (long)i;
143
+ }
144
+ for (size_t i = 0; i < y.size(); i++) {
145
+ y[i] = (long)i + 10;
146
+ }
147
+ for (size_t i = 0; i < x.size(); i++) {
148
+ CYBOZU_TEST_EQUAL(x[i], (long)i);
149
+ }
150
+ for (size_t i = 0; i < y.size(); i++) {
151
+ CYBOZU_TEST_EQUAL(y[i], 10 + (long)i);
152
+ }
153
+ cybozu::AlignedArray<long> z(std::move(x));
154
+ const long* pz = &z[0];
155
+ CYBOZU_TEST_EQUAL(pz, px);
156
+ CYBOZU_TEST_EQUAL(x.data(), (long*)0);
157
+ CYBOZU_TEST_EQUAL(z.data(), px);
158
+ CYBOZU_TEST_EQUAL(z.size(), 10);
159
+ for (size_t i = 0; i < 10; i++) {
160
+ CYBOZU_TEST_EQUAL(z[i], (long)i);
161
+ }
162
+ CYBOZU_TEST_EQUAL(x.size(), 0);
163
+
164
+ z = std::move(y);
165
+ CYBOZU_TEST_EQUAL(py, &z[0]);
166
+ CYBOZU_TEST_EQUAL(py, z.data());
167
+ CYBOZU_TEST_EQUAL(y.size(), 0);
168
+ CYBOZU_TEST_EQUAL(z.size(), 5);
169
+ for (size_t i = 0; i < 5; i++) {
170
+ CYBOZU_TEST_EQUAL(z[i], 10 + (long)i);
171
+ }
172
+ }
173
+ #endif