datasketches 0.3.2 → 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +6 -0
- data/NOTICE +1 -1
- data/README.md +0 -2
- data/ext/datasketches/cpc_wrapper.cpp +2 -2
- data/ext/datasketches/kll_wrapper.cpp +0 -10
- data/lib/datasketches/version.rb +1 -1
- data/lib/datasketches.rb +1 -1
- data/vendor/datasketches-cpp/CMakeLists.txt +1 -0
- data/vendor/datasketches-cpp/CODE_OF_CONDUCT.md +3 -0
- data/vendor/datasketches-cpp/CONTRIBUTING.md +50 -0
- data/vendor/datasketches-cpp/Doxyfile +2827 -0
- data/vendor/datasketches-cpp/LICENSE +0 -76
- data/vendor/datasketches-cpp/NOTICE +1 -1
- data/vendor/datasketches-cpp/README.md +1 -3
- data/vendor/datasketches-cpp/common/CMakeLists.txt +12 -11
- data/vendor/datasketches-cpp/common/include/common_defs.hpp +11 -8
- data/vendor/datasketches-cpp/common/include/count_zeros.hpp +0 -2
- data/vendor/datasketches-cpp/common/include/kolmogorov_smirnov.hpp +9 -6
- data/vendor/datasketches-cpp/common/include/optional.hpp +148 -0
- data/vendor/datasketches-cpp/common/include/quantiles_sorted_view.hpp +95 -2
- data/vendor/datasketches-cpp/common/include/quantiles_sorted_view_impl.hpp +1 -1
- data/vendor/datasketches-cpp/common/include/serde.hpp +69 -20
- data/vendor/datasketches-cpp/common/test/CMakeLists.txt +1 -1
- data/vendor/datasketches-cpp/common/test/optional_test.cpp +85 -0
- data/vendor/datasketches-cpp/common/test/test_allocator.hpp +14 -14
- data/vendor/datasketches-cpp/count/include/count_min.hpp +132 -78
- data/vendor/datasketches-cpp/count/include/count_min_impl.hpp +132 -152
- data/vendor/datasketches-cpp/count/test/CMakeLists.txt +11 -12
- data/vendor/datasketches-cpp/count/test/count_min_allocation_test.cpp +61 -61
- data/vendor/datasketches-cpp/count/test/count_min_test.cpp +175 -178
- data/vendor/datasketches-cpp/cpc/include/cpc_common.hpp +14 -20
- data/vendor/datasketches-cpp/cpc/include/cpc_compressor.hpp +7 -4
- data/vendor/datasketches-cpp/cpc/include/cpc_compressor_impl.hpp +17 -17
- data/vendor/datasketches-cpp/cpc/include/cpc_sketch.hpp +40 -40
- data/vendor/datasketches-cpp/cpc/include/cpc_sketch_impl.hpp +13 -10
- data/vendor/datasketches-cpp/cpc/include/cpc_union.hpp +35 -11
- data/vendor/datasketches-cpp/cpc/include/cpc_union_impl.hpp +8 -8
- data/vendor/datasketches-cpp/cpc/include/u32_table.hpp +3 -2
- data/vendor/datasketches-cpp/cpc/include/u32_table_impl.hpp +5 -5
- data/vendor/datasketches-cpp/cpc/test/CMakeLists.txt +20 -7
- data/vendor/datasketches-cpp/cpc/test/cpc_sketch_deserialize_from_java_test.cpp +60 -0
- data/vendor/datasketches-cpp/{python/include/py_object_lt.hpp → cpc/test/cpc_sketch_serialize_for_java.cpp} +15 -14
- data/vendor/datasketches-cpp/cpc/test/cpc_sketch_test.cpp +4 -29
- data/vendor/datasketches-cpp/cpc/test/cpc_union_test.cpp +4 -4
- data/vendor/datasketches-cpp/density/include/density_sketch.hpp +29 -9
- data/vendor/datasketches-cpp/density/include/density_sketch_impl.hpp +1 -1
- data/vendor/datasketches-cpp/density/test/CMakeLists.txt +0 -1
- data/vendor/datasketches-cpp/fi/include/frequent_items_sketch.hpp +21 -9
- data/vendor/datasketches-cpp/fi/include/frequent_items_sketch_impl.hpp +6 -4
- data/vendor/datasketches-cpp/fi/test/CMakeLists.txt +14 -1
- data/vendor/datasketches-cpp/fi/test/frequent_items_sketch_deserialize_from_java_test.cpp +95 -0
- data/vendor/datasketches-cpp/fi/test/frequent_items_sketch_serialize_for_java.cpp +83 -0
- data/vendor/datasketches-cpp/fi/test/frequent_items_sketch_test.cpp +3 -42
- data/vendor/datasketches-cpp/hll/include/CouponList-internal.hpp +2 -2
- data/vendor/datasketches-cpp/hll/include/CouponList.hpp +3 -1
- data/vendor/datasketches-cpp/hll/include/HllArray-internal.hpp +3 -3
- data/vendor/datasketches-cpp/hll/include/HllArray.hpp +5 -3
- data/vendor/datasketches-cpp/hll/include/HllSketch-internal.hpp +4 -4
- data/vendor/datasketches-cpp/hll/include/HllSketchImpl.hpp +3 -1
- data/vendor/datasketches-cpp/hll/include/HllUtil.hpp +0 -12
- data/vendor/datasketches-cpp/hll/include/hll.hpp +70 -57
- data/vendor/datasketches-cpp/hll/test/CMakeLists.txt +14 -1
- data/vendor/datasketches-cpp/hll/test/ToFromByteArrayTest.cpp +0 -68
- data/vendor/datasketches-cpp/hll/test/hll_sketch_deserialize_from_java_test.cpp +69 -0
- data/vendor/datasketches-cpp/hll/test/hll_sketch_serialize_for_java.cpp +52 -0
- data/vendor/datasketches-cpp/kll/include/kll_helper_impl.hpp +2 -2
- data/vendor/datasketches-cpp/kll/include/kll_sketch.hpp +71 -50
- data/vendor/datasketches-cpp/kll/include/kll_sketch_impl.hpp +59 -130
- data/vendor/datasketches-cpp/kll/test/CMakeLists.txt +14 -1
- data/vendor/datasketches-cpp/kll/test/kll_sketch_deserialize_from_java_test.cpp +103 -0
- data/vendor/datasketches-cpp/kll/test/kll_sketch_serialize_for_java.cpp +62 -0
- data/vendor/datasketches-cpp/kll/test/kll_sketch_test.cpp +3 -38
- data/vendor/datasketches-cpp/quantiles/include/quantiles_sketch.hpp +68 -51
- data/vendor/datasketches-cpp/quantiles/include/quantiles_sketch_impl.hpp +62 -132
- data/vendor/datasketches-cpp/quantiles/test/CMakeLists.txt +14 -1
- data/vendor/datasketches-cpp/quantiles/test/quantiles_sketch_deserialize_from_java_test.cpp +84 -0
- data/vendor/datasketches-cpp/quantiles/test/quantiles_sketch_serialize_for_java.cpp +52 -0
- data/vendor/datasketches-cpp/quantiles/test/quantiles_sketch_test.cpp +14 -38
- data/vendor/datasketches-cpp/req/include/req_common.hpp +7 -3
- data/vendor/datasketches-cpp/req/include/req_compactor_impl.hpp +2 -2
- data/vendor/datasketches-cpp/req/include/req_sketch.hpp +97 -23
- data/vendor/datasketches-cpp/req/include/req_sketch_impl.hpp +48 -109
- data/vendor/datasketches-cpp/req/test/CMakeLists.txt +14 -1
- data/vendor/datasketches-cpp/req/test/req_sketch_deserialize_from_java_test.cpp +55 -0
- data/vendor/datasketches-cpp/{tuple/include/array_of_doubles_intersection_impl.hpp → req/test/req_sketch_serialize_for_java.cpp} +12 -7
- data/vendor/datasketches-cpp/req/test/req_sketch_test.cpp +3 -89
- data/vendor/datasketches-cpp/sampling/CMakeLists.txt +4 -0
- data/vendor/datasketches-cpp/sampling/include/ebpps_sample.hpp +210 -0
- data/vendor/datasketches-cpp/sampling/include/ebpps_sample_impl.hpp +535 -0
- data/vendor/datasketches-cpp/sampling/include/ebpps_sketch.hpp +281 -0
- data/vendor/datasketches-cpp/sampling/include/ebpps_sketch_impl.hpp +531 -0
- data/vendor/datasketches-cpp/sampling/include/var_opt_sketch.hpp +69 -26
- data/vendor/datasketches-cpp/sampling/include/var_opt_sketch_impl.hpp +3 -3
- data/vendor/datasketches-cpp/sampling/include/var_opt_union.hpp +10 -11
- data/vendor/datasketches-cpp/sampling/include/var_opt_union_impl.hpp +4 -4
- data/vendor/datasketches-cpp/sampling/test/CMakeLists.txt +55 -8
- data/vendor/datasketches-cpp/sampling/test/ebpps_allocation_test.cpp +96 -0
- data/vendor/datasketches-cpp/sampling/test/ebpps_sample_test.cpp +137 -0
- data/vendor/datasketches-cpp/sampling/test/ebpps_sketch_test.cpp +266 -0
- data/vendor/datasketches-cpp/sampling/test/var_opt_sketch_deserialize_from_java_test.cpp +81 -0
- data/vendor/datasketches-cpp/sampling/test/var_opt_sketch_serialize_for_java.cpp +54 -0
- data/vendor/datasketches-cpp/sampling/test/var_opt_sketch_test.cpp +0 -37
- data/vendor/datasketches-cpp/sampling/test/var_opt_union_deserialize_from_java_test.cpp +50 -0
- data/vendor/datasketches-cpp/sampling/test/var_opt_union_serialize_for_java.cpp +56 -0
- data/vendor/datasketches-cpp/sampling/test/var_opt_union_test.cpp +0 -18
- data/vendor/datasketches-cpp/theta/include/bit_packing.hpp +2608 -2608
- data/vendor/datasketches-cpp/theta/include/bounds_on_ratios_in_sampled_sets.hpp +1 -0
- data/vendor/datasketches-cpp/theta/include/bounds_on_ratios_in_theta_sketched_sets.hpp +7 -6
- data/vendor/datasketches-cpp/theta/include/theta_a_not_b.hpp +20 -5
- data/vendor/datasketches-cpp/theta/include/theta_constants.hpp +10 -4
- data/vendor/datasketches-cpp/theta/include/theta_helpers.hpp +1 -1
- data/vendor/datasketches-cpp/theta/include/theta_intersection.hpp +13 -5
- data/vendor/datasketches-cpp/theta/include/theta_intersection_base_impl.hpp +5 -5
- data/vendor/datasketches-cpp/theta/include/theta_intersection_impl.hpp +3 -3
- data/vendor/datasketches-cpp/theta/include/theta_jaccard_similarity.hpp +2 -1
- data/vendor/datasketches-cpp/theta/include/theta_jaccard_similarity_base.hpp +1 -0
- data/vendor/datasketches-cpp/theta/include/theta_set_difference_base_impl.hpp +1 -1
- data/vendor/datasketches-cpp/theta/include/theta_sketch.hpp +126 -27
- data/vendor/datasketches-cpp/theta/include/theta_sketch_impl.hpp +8 -8
- data/vendor/datasketches-cpp/theta/include/theta_union.hpp +17 -10
- data/vendor/datasketches-cpp/theta/include/theta_union_base_impl.hpp +1 -1
- data/vendor/datasketches-cpp/theta/include/theta_union_impl.hpp +3 -3
- data/vendor/datasketches-cpp/theta/include/theta_update_sketch_base.hpp +5 -2
- data/vendor/datasketches-cpp/theta/include/theta_update_sketch_base_impl.hpp +11 -1
- data/vendor/datasketches-cpp/theta/test/CMakeLists.txt +14 -1
- data/vendor/datasketches-cpp/theta/test/theta_sketch_deserialize_from_java_test.cpp +57 -0
- data/vendor/datasketches-cpp/theta/test/theta_sketch_serialize_for_java.cpp +61 -0
- data/vendor/datasketches-cpp/theta/test/theta_sketch_test.cpp +0 -188
- data/vendor/datasketches-cpp/tuple/CMakeLists.txt +8 -7
- data/vendor/datasketches-cpp/tuple/include/array_of_doubles_sketch.hpp +19 -144
- data/vendor/datasketches-cpp/tuple/include/{array_of_doubles_a_not_b.hpp → array_tuple_a_not_b.hpp} +24 -16
- data/vendor/datasketches-cpp/tuple/include/{array_of_doubles_a_not_b_impl.hpp → array_tuple_a_not_b_impl.hpp} +4 -4
- data/vendor/datasketches-cpp/tuple/include/array_tuple_intersection.hpp +65 -0
- data/vendor/datasketches-cpp/{python/include/py_object_ostream.hpp → tuple/include/array_tuple_intersection_impl.hpp} +7 -24
- data/vendor/datasketches-cpp/tuple/include/array_tuple_sketch.hpp +237 -0
- data/vendor/datasketches-cpp/tuple/include/{array_of_doubles_sketch_impl.hpp → array_tuple_sketch_impl.hpp} +40 -41
- data/vendor/datasketches-cpp/tuple/include/array_tuple_union.hpp +81 -0
- data/vendor/datasketches-cpp/tuple/include/array_tuple_union_impl.hpp +43 -0
- data/vendor/datasketches-cpp/tuple/include/tuple_a_not_b.hpp +11 -2
- data/vendor/datasketches-cpp/tuple/include/tuple_intersection.hpp +17 -10
- data/vendor/datasketches-cpp/tuple/include/tuple_jaccard_similarity.hpp +2 -1
- data/vendor/datasketches-cpp/tuple/include/tuple_sketch.hpp +95 -32
- data/vendor/datasketches-cpp/tuple/include/tuple_union.hpp +19 -11
- data/vendor/datasketches-cpp/tuple/test/CMakeLists.txt +16 -1
- data/vendor/datasketches-cpp/tuple/test/aod_sketch_deserialize_from_java_test.cpp +76 -0
- data/vendor/datasketches-cpp/tuple/test/aod_sketch_serialize_for_java.cpp +62 -0
- data/vendor/datasketches-cpp/tuple/test/array_of_doubles_sketch_test.cpp +5 -129
- data/vendor/datasketches-cpp/tuple/test/engagement_test.cpp +85 -89
- data/vendor/datasketches-cpp/tuple/test/tuple_jaccard_similarity_test.cpp +3 -1
- data/vendor/datasketches-cpp/tuple/test/tuple_sketch_deserialize_from_java_test.cpp +47 -0
- data/vendor/datasketches-cpp/tuple/test/tuple_sketch_serialize_for_java.cpp +38 -0
- data/vendor/datasketches-cpp/tuple/test/tuple_sketch_test.cpp +1 -1
- data/vendor/datasketches-cpp/version.cfg.in +1 -1
- metadata +47 -93
- data/vendor/datasketches-cpp/MANIFEST.in +0 -39
- data/vendor/datasketches-cpp/fi/test/items_sketch_string_from_java.sk +0 -0
- data/vendor/datasketches-cpp/fi/test/items_sketch_string_utf8_from_java.sk +0 -0
- data/vendor/datasketches-cpp/fi/test/longs_sketch_from_java.sk +0 -0
- data/vendor/datasketches-cpp/hll/test/array6_from_java.sk +0 -0
- data/vendor/datasketches-cpp/hll/test/compact_array4_from_java.sk +0 -0
- data/vendor/datasketches-cpp/hll/test/compact_set_from_java.sk +0 -0
- data/vendor/datasketches-cpp/hll/test/list_from_java.sk +0 -0
- data/vendor/datasketches-cpp/hll/test/updatable_array4_from_java.sk +0 -0
- data/vendor/datasketches-cpp/hll/test/updatable_set_from_java.sk +0 -0
- data/vendor/datasketches-cpp/kll/test/kll_sketch_from_java.sk +0 -0
- data/vendor/datasketches-cpp/pyproject.toml +0 -23
- data/vendor/datasketches-cpp/python/CMakeLists.txt +0 -87
- data/vendor/datasketches-cpp/python/README.md +0 -85
- data/vendor/datasketches-cpp/python/datasketches/DensityWrapper.py +0 -87
- data/vendor/datasketches-cpp/python/datasketches/KernelFunction.py +0 -35
- data/vendor/datasketches-cpp/python/datasketches/PySerDe.py +0 -110
- data/vendor/datasketches-cpp/python/datasketches/TuplePolicy.py +0 -77
- data/vendor/datasketches-cpp/python/datasketches/TupleWrapper.py +0 -205
- data/vendor/datasketches-cpp/python/datasketches/__init__.py +0 -38
- data/vendor/datasketches-cpp/python/include/kernel_function.hpp +0 -98
- data/vendor/datasketches-cpp/python/include/py_serde.hpp +0 -113
- data/vendor/datasketches-cpp/python/include/quantile_conditional.hpp +0 -104
- data/vendor/datasketches-cpp/python/include/tuple_policy.hpp +0 -136
- data/vendor/datasketches-cpp/python/jupyter/CPCSketch.ipynb +0 -345
- data/vendor/datasketches-cpp/python/jupyter/FrequentItemsSketch.ipynb +0 -354
- data/vendor/datasketches-cpp/python/jupyter/HLLSketch.ipynb +0 -346
- data/vendor/datasketches-cpp/python/jupyter/KLLSketch.ipynb +0 -463
- data/vendor/datasketches-cpp/python/jupyter/ThetaSketchNotebook.ipynb +0 -403
- data/vendor/datasketches-cpp/python/pybind11Path.cmd +0 -21
- data/vendor/datasketches-cpp/python/src/__init__.py +0 -18
- data/vendor/datasketches-cpp/python/src/count_wrapper.cpp +0 -101
- data/vendor/datasketches-cpp/python/src/cpc_wrapper.cpp +0 -76
- data/vendor/datasketches-cpp/python/src/datasketches.cpp +0 -58
- data/vendor/datasketches-cpp/python/src/density_wrapper.cpp +0 -95
- data/vendor/datasketches-cpp/python/src/fi_wrapper.cpp +0 -182
- data/vendor/datasketches-cpp/python/src/hll_wrapper.cpp +0 -126
- data/vendor/datasketches-cpp/python/src/kll_wrapper.cpp +0 -158
- data/vendor/datasketches-cpp/python/src/ks_wrapper.cpp +0 -68
- data/vendor/datasketches-cpp/python/src/py_serde.cpp +0 -112
- data/vendor/datasketches-cpp/python/src/quantiles_wrapper.cpp +0 -155
- data/vendor/datasketches-cpp/python/src/req_wrapper.cpp +0 -154
- data/vendor/datasketches-cpp/python/src/theta_wrapper.cpp +0 -166
- data/vendor/datasketches-cpp/python/src/tuple_wrapper.cpp +0 -215
- data/vendor/datasketches-cpp/python/src/vector_of_kll.cpp +0 -490
- data/vendor/datasketches-cpp/python/src/vo_wrapper.cpp +0 -173
- data/vendor/datasketches-cpp/python/tests/__init__.py +0 -16
- data/vendor/datasketches-cpp/python/tests/count_min_test.py +0 -86
- data/vendor/datasketches-cpp/python/tests/cpc_test.py +0 -64
- data/vendor/datasketches-cpp/python/tests/density_test.py +0 -93
- data/vendor/datasketches-cpp/python/tests/fi_test.py +0 -149
- data/vendor/datasketches-cpp/python/tests/hll_test.py +0 -129
- data/vendor/datasketches-cpp/python/tests/kll_test.py +0 -159
- data/vendor/datasketches-cpp/python/tests/quantiles_test.py +0 -160
- data/vendor/datasketches-cpp/python/tests/req_test.py +0 -159
- data/vendor/datasketches-cpp/python/tests/theta_test.py +0 -148
- data/vendor/datasketches-cpp/python/tests/tuple_test.py +0 -206
- data/vendor/datasketches-cpp/python/tests/vector_of_kll_test.py +0 -148
- data/vendor/datasketches-cpp/python/tests/vo_test.py +0 -132
- data/vendor/datasketches-cpp/req/test/req_float_empty_from_java.sk +0 -0
- data/vendor/datasketches-cpp/req/test/req_float_estimation_from_java.sk +0 -0
- data/vendor/datasketches-cpp/req/test/req_float_exact_from_java.sk +0 -0
- data/vendor/datasketches-cpp/req/test/req_float_raw_items_from_java.sk +0 -0
- data/vendor/datasketches-cpp/req/test/req_float_single_item_from_java.sk +0 -0
- data/vendor/datasketches-cpp/sampling/test/binaries_from_java.txt +0 -67
- data/vendor/datasketches-cpp/sampling/test/varopt_sketch_long_sampling.sk +0 -0
- data/vendor/datasketches-cpp/sampling/test/varopt_sketch_string_exact.sk +0 -0
- data/vendor/datasketches-cpp/sampling/test/varopt_union_double_sampling.sk +0 -0
- data/vendor/datasketches-cpp/setup.py +0 -110
- data/vendor/datasketches-cpp/theta/test/theta_compact_empty_from_java.sk +0 -0
- data/vendor/datasketches-cpp/theta/test/theta_compact_estimation_from_java.sk +0 -0
- data/vendor/datasketches-cpp/theta/test/theta_compact_exact_from_java.sk +0 -0
- data/vendor/datasketches-cpp/theta/test/theta_compact_single_item_from_java.sk +0 -0
- data/vendor/datasketches-cpp/tox.ini +0 -26
- data/vendor/datasketches-cpp/tuple/include/array_of_doubles_intersection.hpp +0 -52
- data/vendor/datasketches-cpp/tuple/include/array_of_doubles_union.hpp +0 -81
- data/vendor/datasketches-cpp/tuple/include/array_of_doubles_union_impl.hpp +0 -43
- data/vendor/datasketches-cpp/tuple/test/aod_1_compact_empty_from_java.sk +0 -1
- data/vendor/datasketches-cpp/tuple/test/aod_1_compact_estimation_from_java.sk +0 -0
- data/vendor/datasketches-cpp/tuple/test/aod_1_compact_non_empty_no_entries_from_java.sk +0 -0
- data/vendor/datasketches-cpp/tuple/test/aod_2_compact_exact_from_java.sk +0 -0
- data/vendor/datasketches-cpp/tuple/test/aod_3_compact_empty_from_java.sk +0 -1
@@ -205,7 +205,6 @@ APPENDIX A: How to apply the Apache License to your work.
|
|
205
205
|
-------------------------------------------------------------
|
206
206
|
|
207
207
|
|
208
|
-
|
209
208
|
APPENDIX B: Additional licenses relevant to this product.
|
210
209
|
|
211
210
|
This product includes a number of source files with code that has been
|
@@ -215,43 +214,6 @@ APPENDIX B: Additional licenses relevant to this product.
|
|
215
214
|
conditions of the following licenses.
|
216
215
|
|
217
216
|
|
218
|
-
|
219
|
-
=============================================================
|
220
|
-
MIT License
|
221
|
-
=============================================================
|
222
|
-
Original source code:
|
223
|
-
https://github.com/benjaminjack/python_cpp_example
|
224
|
-
-------------------------------------------------------------
|
225
|
-
Copyright (c) 2017 Benjamin R. Jack
|
226
|
-
|
227
|
-
MIT License (https://opensource.org/licenses/MIT):
|
228
|
-
|
229
|
-
Permission is hereby granted, free of charge, to any person
|
230
|
-
obtaining a copy of this software and associated documentation
|
231
|
-
files (the "Software"), to deal in the Software without restriction,
|
232
|
-
including without limitation the rights to use, copy, modify, merge,
|
233
|
-
publish, distribute, sublicense, and/or sell copies of the Software,
|
234
|
-
and to permit persons to whom the Software is furnished to do so,
|
235
|
-
subject to the following conditions:
|
236
|
-
|
237
|
-
The above copyright notice and this permission notice shall be
|
238
|
-
included in all copies or substantial portions of the Software.
|
239
|
-
|
240
|
-
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
241
|
-
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
|
242
|
-
OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
243
|
-
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
|
244
|
-
BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
|
245
|
-
ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
|
246
|
-
CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
247
|
-
SOFTWARE.
|
248
|
-
-------------------------------------------------------------
|
249
|
-
Code locations:
|
250
|
-
* https://github.com/apache/datasketches-cpp/blob/master/setup.py
|
251
|
-
that is adapted from the above.
|
252
|
-
|
253
|
-
|
254
|
-
|
255
217
|
=============================================================
|
256
218
|
Boost License (https://www.boost.org/LICENSE_1_0.txt)
|
257
219
|
=============================================================
|
@@ -287,44 +249,6 @@ APPENDIX B: Additional licenses relevant to this product.
|
|
287
249
|
of CMake configuration if configured to build tests.
|
288
250
|
|
289
251
|
|
290
|
-
=============================================================
|
291
|
-
BSD License
|
292
|
-
=============================================================
|
293
|
-
Original source code:
|
294
|
-
https://github.com/pybind/pybind11/blob/master/LICENSE
|
295
|
-
|
296
|
-
Copyright (c) 2016 Wenzel Jakob <wenzel.jakob@epfl.ch>, All rights reserved.
|
297
|
-
|
298
|
-
Redistribution and use in source and binary forms, with or without
|
299
|
-
modification, are permitted provided that the following conditions are met:
|
300
|
-
|
301
|
-
1. Redistributions of source code must retain the above copyright notice, this
|
302
|
-
list of conditions and the following disclaimer.
|
303
|
-
|
304
|
-
2. Redistributions in binary form must reproduce the above copyright notice,
|
305
|
-
this list of conditions and the following disclaimer in the documentation
|
306
|
-
and/or other materials provided with the distribution.
|
307
|
-
|
308
|
-
3. Neither the name of the copyright holder nor the names of its contributors
|
309
|
-
may be used to endorse or promote products derived from this software
|
310
|
-
without specific prior written permission.
|
311
|
-
|
312
|
-
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
313
|
-
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
314
|
-
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
315
|
-
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
316
|
-
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
317
|
-
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
318
|
-
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
319
|
-
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
320
|
-
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
321
|
-
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
322
|
-
-------------------------------------------------------------
|
323
|
-
Code Locations:
|
324
|
-
Found only in the convenience binaries distributed from PyPI, which rely
|
325
|
-
on pybind11 code during compilation.
|
326
|
-
|
327
|
-
|
328
252
|
=============================================================
|
329
253
|
Public Domain
|
330
254
|
=============================================================
|
@@ -14,9 +14,7 @@ If you are interested in making contributions to this site please see our [Commu
|
|
14
14
|
|
15
15
|
This code requires C++11.
|
16
16
|
|
17
|
-
This
|
18
|
-
|
19
|
-
This library is header-only. The build process provided is only for building unit tests and the python library.
|
17
|
+
This library is header-only. The build process provided is only for building unit tests.
|
20
18
|
|
21
19
|
Building the unit tests requires cmake 3.12.0 or higher.
|
22
20
|
|
@@ -35,19 +35,20 @@ install(TARGETS common EXPORT ${PROJECT_NAME})
|
|
35
35
|
|
36
36
|
install(FILES
|
37
37
|
${CMAKE_CURRENT_BINARY_DIR}/include/version.hpp
|
38
|
+
include/binomial_bounds.hpp
|
39
|
+
include/bounds_binomial_proportions.hpp
|
40
|
+
include/ceiling_power_of_2.hpp
|
38
41
|
include/common_defs.hpp
|
42
|
+
include/conditional_back_inserter.hpp
|
43
|
+
include/conditional_forward.hpp
|
44
|
+
include/count_zeros.hpp
|
45
|
+
include/inv_pow2_table.hpp
|
46
|
+
include/kolmogorov_smirnov_impl.hpp
|
47
|
+
include/kolmogorov_smirnov.hpp
|
39
48
|
include/memory_operations.hpp
|
40
49
|
include/MurmurHash3.h
|
41
|
-
|
42
|
-
|
43
|
-
include/inv_pow2_table.hpp
|
44
|
-
include/binomial_bounds.hpp
|
45
|
-
include/conditional_back_inserter.hpp
|
46
|
-
include/conditional_forward.hpp
|
47
|
-
include/ceiling_power_of_2.hpp
|
48
|
-
include/bounds_binomial_proportions.hpp
|
50
|
+
include/optional.hpp
|
51
|
+
include/quantiles_sorted_view_impl.hpp
|
49
52
|
include/quantiles_sorted_view.hpp
|
50
|
-
|
51
|
-
include/kolmogorov_smirnov.hpp
|
52
|
-
include/kolmogorov_smirnov_impl.hpp
|
53
|
+
include/serde.hpp
|
53
54
|
DESTINATION "${CMAKE_INSTALL_INCLUDEDIR}/DataSketches")
|
@@ -28,27 +28,30 @@
|
|
28
28
|
#include <chrono>
|
29
29
|
#include <thread>
|
30
30
|
|
31
|
+
/// DataSketches namespace
|
31
32
|
namespace datasketches {
|
32
33
|
|
33
34
|
static const uint64_t DEFAULT_SEED = 9001;
|
34
35
|
|
35
36
|
enum resize_factor { X1 = 0, X2, X4, X8 };
|
36
37
|
|
37
|
-
template<typename A> using
|
38
|
-
template<typename A> using string = std::basic_string<char, std::char_traits<char>, AllocChar<A>>;
|
39
|
-
|
40
|
-
// thread-safe random bit
|
41
|
-
static thread_local std::independent_bits_engine<std::mt19937, 1, uint32_t>
|
42
|
-
random_bit(static_cast<uint32_t>(std::chrono::system_clock::now().time_since_epoch().count()
|
43
|
-
+ std::hash<std::thread::id>{}(std::this_thread::get_id())));
|
38
|
+
template<typename A> using string = std::basic_string<char, std::char_traits<char>, typename std::allocator_traits<A>::template rebind_alloc<char>>;
|
44
39
|
|
45
40
|
// common random declarations
|
46
41
|
namespace random_utils {
|
47
42
|
static std::random_device rd; // possibly unsafe in MinGW with GCC < 9.2
|
48
43
|
static thread_local std::mt19937_64 rand(rd());
|
49
44
|
static thread_local std::uniform_real_distribution<> next_double(0.0, 1.0);
|
50
|
-
}
|
51
45
|
|
46
|
+
// thread-safe random bit
|
47
|
+
static thread_local std::independent_bits_engine<std::mt19937, 1, uint32_t>
|
48
|
+
random_bit(static_cast<uint32_t>(std::chrono::system_clock::now().time_since_epoch().count()
|
49
|
+
+ std::hash<std::thread::id>{}(std::this_thread::get_id())));
|
50
|
+
|
51
|
+
inline void override_seed(uint64_t s) {
|
52
|
+
rand.seed(s);
|
53
|
+
}
|
54
|
+
}
|
52
55
|
|
53
56
|
// utility function to hide unused compiler warning
|
54
57
|
// usually has no additional cost
|
@@ -22,13 +22,16 @@
|
|
22
22
|
|
23
23
|
namespace datasketches {
|
24
24
|
|
25
|
+
/**
|
26
|
+
* Kolmogorov-Smirnov test for KLL or Quantiles sketches
|
27
|
+
*/
|
25
28
|
class kolmogorov_smirnov {
|
26
29
|
public:
|
27
30
|
/**
|
28
31
|
* Computes the raw delta area between two quantile sketches for the Kolmogorov-Smirnov Test.
|
29
32
|
* Will work for a type-matched pair of KLL or Quantiles sketches of the same parameterized type T.
|
30
|
-
* @param sketch1
|
31
|
-
* @param sketch2
|
33
|
+
* @param sketch1 sketch 1
|
34
|
+
* @param sketch2 sketch 2
|
32
35
|
* @return the raw delta between two KLL quantile sketches
|
33
36
|
*/
|
34
37
|
template<typename Sketch>
|
@@ -39,8 +42,8 @@ public:
|
|
39
42
|
* Adjusts the computed threshold by the error epsilons of the two given sketches.
|
40
43
|
* See <a href="https://en.wikipedia.org/wiki/Kolmogorov-Smirnov_test">Kolmogorov–Smirnov Test</a>
|
41
44
|
* Will work for a type-matched pair of KLL or Quantiles sketches of the same parameterized type T.
|
42
|
-
* @param sketch1
|
43
|
-
* @param sketch2
|
45
|
+
* @param sketch1 sketch 1
|
46
|
+
* @param sketch2 sketch 2
|
44
47
|
* @param p Target p-value. Typically .001 to .1, e.g., .05.
|
45
48
|
* @return the adjusted threshold to be compared with the raw delta
|
46
49
|
*/
|
@@ -52,8 +55,8 @@ public:
|
|
52
55
|
* Will work for a type-matched pair of KLL or Quantiles sketches of the same parameterized type T.
|
53
56
|
* Note: if the given sketches have insufficient data or if the sketch sizes are too small,
|
54
57
|
* this will return false.
|
55
|
-
* @param sketch1
|
56
|
-
* @param sketch2
|
58
|
+
* @param sketch1 sketch 1
|
59
|
+
* @param sketch2 sketch 2
|
57
60
|
* @param p Target p-value. Typically .001 to .1, e.g., .05.
|
58
61
|
* @return Boolean indicating whether we can reject the null hypothesis (that the sketches
|
59
62
|
* reflect the same underlying distribution) using the provided p-value.
|
@@ -0,0 +1,148 @@
|
|
1
|
+
/*
|
2
|
+
* Licensed to the Apache Software Foundation (ASF) under one
|
3
|
+
* or more contributor license agreements. See the NOTICE file
|
4
|
+
* distributed with this work for additional information
|
5
|
+
* regarding copyright ownership. The ASF licenses this file
|
6
|
+
* to you under the Apache License, Version 2.0 (the
|
7
|
+
* "License"); you may not use this file except in compliance
|
8
|
+
* with the License. You may obtain a copy of the License at
|
9
|
+
*
|
10
|
+
* http://www.apache.org/licenses/LICENSE-2.0
|
11
|
+
*
|
12
|
+
* Unless required by applicable law or agreed to in writing,
|
13
|
+
* software distributed under the License is distributed on an
|
14
|
+
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
15
|
+
* KIND, either express or implied. See the License for the
|
16
|
+
* specific language governing permissions and limitations
|
17
|
+
* under the License.
|
18
|
+
*/
|
19
|
+
|
20
|
+
#ifndef _OPTIONAL_HPP_
|
21
|
+
#define _OPTIONAL_HPP_
|
22
|
+
|
23
|
+
// This is a simplistic substitute for std::optional until we require C++17
|
24
|
+
|
25
|
+
#if (__cplusplus >= 201703L || (defined(_MSVC_LANG) && _MSVC_LANG >= 201703L))
|
26
|
+
#include <optional>
|
27
|
+
using std::optional;
|
28
|
+
#else
|
29
|
+
|
30
|
+
#include <type_traits>
|
31
|
+
|
32
|
+
namespace datasketches {
|
33
|
+
|
34
|
+
template<typename T>
|
35
|
+
class optional {
|
36
|
+
public:
|
37
|
+
|
38
|
+
optional() noexcept: initialized_(false) {}
|
39
|
+
|
40
|
+
optional(const T& value) noexcept(std::is_nothrow_copy_constructible<T>::value) {
|
41
|
+
new (&value_) T(value);
|
42
|
+
initialized_ = true;
|
43
|
+
}
|
44
|
+
|
45
|
+
optional(T&& value) noexcept(std::is_nothrow_move_constructible<T>::value) {
|
46
|
+
new (&value_) T(std::move(value));
|
47
|
+
initialized_ = true;
|
48
|
+
}
|
49
|
+
|
50
|
+
// conversion from compatible types
|
51
|
+
template<typename TT>
|
52
|
+
optional(const optional<TT>& other) noexcept(std::is_nothrow_constructible<T, TT>::value): initialized_(false) {
|
53
|
+
if (other.initialized_) {
|
54
|
+
new (&value_) T(other.value_);
|
55
|
+
initialized_ = true;
|
56
|
+
}
|
57
|
+
}
|
58
|
+
|
59
|
+
optional(const optional& other) noexcept(std::is_nothrow_copy_constructible<T>::value): initialized_(false) {
|
60
|
+
if (other.initialized_) {
|
61
|
+
new (&value_) T(other.value_);
|
62
|
+
initialized_ = true;
|
63
|
+
}
|
64
|
+
}
|
65
|
+
|
66
|
+
optional(optional&& other) noexcept(std::is_nothrow_move_constructible<T>::value): initialized_(false) {
|
67
|
+
if (other.initialized_) {
|
68
|
+
new (&value_) T(std::move(other.value_));
|
69
|
+
initialized_ = true;
|
70
|
+
}
|
71
|
+
}
|
72
|
+
|
73
|
+
~optional() noexcept(std::is_nothrow_destructible<T>::value) {
|
74
|
+
if (initialized_) value_.~T();
|
75
|
+
}
|
76
|
+
|
77
|
+
explicit operator bool() const noexcept {
|
78
|
+
return initialized_;
|
79
|
+
}
|
80
|
+
|
81
|
+
optional& operator=(const optional& other)
|
82
|
+
noexcept(std::is_nothrow_copy_constructible<T>::value && std::is_nothrow_copy_assignable<T>::value) {
|
83
|
+
if (initialized_) {
|
84
|
+
if (other.initialized_) {
|
85
|
+
value_ = other.value_;
|
86
|
+
} else {
|
87
|
+
reset();
|
88
|
+
}
|
89
|
+
} else {
|
90
|
+
if (other.initialized_) {
|
91
|
+
new (&value_) T(other.value_);
|
92
|
+
initialized_ = true;
|
93
|
+
}
|
94
|
+
}
|
95
|
+
return *this;
|
96
|
+
}
|
97
|
+
|
98
|
+
optional& operator=(optional&& other)
|
99
|
+
noexcept(std::is_nothrow_move_constructible<T>::value && std::is_nothrow_move_assignable<T>::value) {
|
100
|
+
if (initialized_) {
|
101
|
+
if (other.initialized_) {
|
102
|
+
value_ = std::move(other.value_);
|
103
|
+
} else {
|
104
|
+
reset();
|
105
|
+
}
|
106
|
+
} else {
|
107
|
+
if (other.initialized_) {
|
108
|
+
new (&value_) T(std::move(other.value_));
|
109
|
+
initialized_ = true;
|
110
|
+
}
|
111
|
+
}
|
112
|
+
return *this;
|
113
|
+
}
|
114
|
+
|
115
|
+
template<typename... Args>
|
116
|
+
void emplace(Args&&... args) noexcept(std::is_nothrow_constructible<T, Args...>::value) {
|
117
|
+
new (&value_) T(args...);
|
118
|
+
initialized_ = true;
|
119
|
+
}
|
120
|
+
|
121
|
+
T& operator*() & noexcept { return value_; }
|
122
|
+
const T& operator*() const & noexcept { return value_; }
|
123
|
+
T&& operator*() && noexcept { return std::move(value_); }
|
124
|
+
const T&& operator*() const && noexcept { return std::move(value_); }
|
125
|
+
|
126
|
+
T* operator->() noexcept { return &value_; }
|
127
|
+
const T* operator->() const noexcept { return &value_; }
|
128
|
+
|
129
|
+
void reset() noexcept(std::is_nothrow_destructible<T>::value) {
|
130
|
+
if (initialized_) value_.~T();
|
131
|
+
initialized_ = false;
|
132
|
+
}
|
133
|
+
|
134
|
+
private:
|
135
|
+
union {
|
136
|
+
T value_;
|
137
|
+
};
|
138
|
+
bool initialized_;
|
139
|
+
|
140
|
+
// for converting constructor
|
141
|
+
template<typename TT> friend class optional;
|
142
|
+
};
|
143
|
+
|
144
|
+
} // namespace
|
145
|
+
|
146
|
+
#endif // C++17
|
147
|
+
|
148
|
+
#endif // _OPTIONAL_HPP_
|
@@ -27,6 +27,9 @@
|
|
27
27
|
|
28
28
|
namespace datasketches {
|
29
29
|
|
30
|
+
/**
|
31
|
+
* Sorted view for quantiles sketches (REQ, KLL and Quantiles)
|
32
|
+
*/
|
30
33
|
template<
|
31
34
|
typename T,
|
32
35
|
typename Comparator, // strict weak ordering function (see C++ named requirements: Compare)
|
@@ -34,30 +37,119 @@ template<
|
|
34
37
|
>
|
35
38
|
class quantiles_sorted_view {
|
36
39
|
public:
|
40
|
+
/// Entry type
|
37
41
|
using Entry = typename std::conditional<std::is_arithmetic<T>::value, std::pair<T, uint64_t>, std::pair<const T*, uint64_t>>::type;
|
38
42
|
using AllocEntry = typename std::allocator_traits<Allocator>::template rebind_alloc<Entry>;
|
39
43
|
using Container = std::vector<Entry, AllocEntry>;
|
40
44
|
|
45
|
+
/// @private
|
41
46
|
quantiles_sorted_view(uint32_t num, const Comparator& comparator, const Allocator& allocator);
|
42
47
|
|
48
|
+
/// @private
|
43
49
|
template<typename Iterator>
|
44
50
|
void add(Iterator begin, Iterator end, uint64_t weight);
|
45
51
|
|
52
|
+
/// @private
|
46
53
|
void convert_to_cummulative();
|
47
54
|
|
48
55
|
class const_iterator;
|
56
|
+
|
57
|
+
/**
|
58
|
+
* Iterator pointing to the first entry in the view.
|
59
|
+
* If the view is empty, the returned iterator must not be dereferenced or incremented.
|
60
|
+
* @return iterator pointing to the first entry
|
61
|
+
*/
|
49
62
|
const_iterator begin() const;
|
63
|
+
|
64
|
+
/**
|
65
|
+
* Iterator pointing to the past-the-end entry in the view.
|
66
|
+
* The past-the-end entry is the hypothetical entry that would follow the last entry.
|
67
|
+
* It does not point to any entry, and must not be dereferenced or incremented.
|
68
|
+
* @return iterator pointing to the past-the-end entry
|
69
|
+
*/
|
50
70
|
const_iterator end() const;
|
51
71
|
|
72
|
+
/// @return size of the view
|
52
73
|
size_t size() const;
|
53
74
|
|
75
|
+
/**
|
76
|
+
* Returns an approximation to the normalized rank of the given item.
|
77
|
+
*
|
78
|
+
* <p>If the view is empty this throws std::runtime_error.
|
79
|
+
*
|
80
|
+
* @param item to be ranked
|
81
|
+
* @param inclusive if true the weight of the given item is included into the rank.
|
82
|
+
* Otherwise the rank equals the sum of the weights of all items that are less than the given item
|
83
|
+
* according to the Comparator.
|
84
|
+
*
|
85
|
+
* @return an approximate normalized rank of the given item (0 to 1 inclusive)
|
86
|
+
*/
|
54
87
|
double get_rank(const T& item, bool inclusive = true) const;
|
55
88
|
|
89
|
+
/**
|
90
|
+
* Quantile return type.
|
91
|
+
* This is to return quantiles either by value (for arithmetic types) or by const reference (for all other types)
|
92
|
+
*/
|
56
93
|
using quantile_return_type = typename std::conditional<std::is_arithmetic<T>::value, T, const T&>::type;
|
94
|
+
|
95
|
+
/**
|
96
|
+
* Returns an item from the sketch that is the best approximation to an item
|
97
|
+
* from the original stream with the given normalized rank.
|
98
|
+
*
|
99
|
+
* <p>If the view is empty this throws std::runtime_error.
|
100
|
+
*
|
101
|
+
* @param rank of an item in the hypothetical sorted stream.
|
102
|
+
* @param inclusive if true, the given rank is considered inclusive (includes weight of an item)
|
103
|
+
*
|
104
|
+
* @return approximate quantile associated with the given normalized rank
|
105
|
+
*/
|
57
106
|
quantile_return_type get_quantile(double rank, bool inclusive = true) const;
|
58
107
|
|
59
108
|
using vector_double = std::vector<double, typename std::allocator_traits<Allocator>::template rebind_alloc<double>>;
|
109
|
+
|
110
|
+
/**
|
111
|
+
* Returns an approximation to the Cumulative Distribution Function (CDF), which is the
|
112
|
+
* cumulative analog of the PMF, of the input stream given a set of split points (items).
|
113
|
+
*
|
114
|
+
* <p>If the view is empty this throws std::runtime_error.
|
115
|
+
*
|
116
|
+
* @param split_points an array of <i>m</i> unique, monotonically increasing items
|
117
|
+
* that divide the input domain into <i>m+1</i> consecutive disjoint intervals.
|
118
|
+
*
|
119
|
+
* @param size the number of split points in the array
|
120
|
+
*
|
121
|
+
* @param inclusive if true the rank of an item includes its own weight, and therefore
|
122
|
+
* if the sketch contains items equal to a slit point, then in CDF such items are
|
123
|
+
* included into the interval to the left of split point. Otherwise they are included into
|
124
|
+
* the interval to the right of split point.
|
125
|
+
*
|
126
|
+
* @return an array of m+1 doubles, which are a consecutive approximation to the CDF
|
127
|
+
* of the input stream given the split_points. The value at array position j of the returned
|
128
|
+
* CDF array is the sum of the returned values in positions 0 through j of the returned PMF
|
129
|
+
* array. This can be viewed as array of ranks of the given split points plus one more value
|
130
|
+
* that is always 1.
|
131
|
+
*/
|
60
132
|
vector_double get_CDF(const T* split_points, uint32_t size, bool inclusive = true) const;
|
133
|
+
|
134
|
+
/**
|
135
|
+
* Returns an approximation to the Probability Mass Function (PMF) of the input stream
|
136
|
+
* given a set of split points (items).
|
137
|
+
*
|
138
|
+
* <p>If the view is empty this throws std::runtime_error.
|
139
|
+
*
|
140
|
+
* @param split_points an array of <i>m</i> unique, monotonically increasing items
|
141
|
+
* that divide the input domain into <i>m+1</i> consecutive disjoint intervals (bins).
|
142
|
+
*
|
143
|
+
* @param size the number of split points in the array
|
144
|
+
*
|
145
|
+
* @param inclusive if true the rank of an item includes its own weight, and therefore
|
146
|
+
* if the sketch contains items equal to a slit point, then in PMF such items are
|
147
|
+
* included into the interval to the left of split point. Otherwise they are included into the interval
|
148
|
+
* to the right of split point.
|
149
|
+
*
|
150
|
+
* @return an array of m+1 doubles each of which is an approximation
|
151
|
+
* to the fraction of the input stream items (the mass) that fall into one of those intervals.
|
152
|
+
*/
|
61
153
|
vector_double get_PMF(const T* split_points, uint32_t size, bool inclusive = true) const;
|
62
154
|
|
63
155
|
private:
|
@@ -122,8 +214,6 @@ public:
|
|
122
214
|
using Base = typename quantiles_sorted_view<T, C, A>::Container::const_iterator;
|
123
215
|
using value_type = typename std::conditional<std::is_arithmetic<T>::value, typename Base::value_type, std::pair<const T&, const uint64_t>>::type;
|
124
216
|
|
125
|
-
const_iterator(const Base& it, const Base& begin): Base(it), begin(begin) {}
|
126
|
-
|
127
217
|
template<typename TT = T, typename std::enable_if<std::is_arithmetic<TT>::value, int>::type = 0>
|
128
218
|
const value_type operator*() const { return Base::operator*(); }
|
129
219
|
|
@@ -147,6 +237,9 @@ public:
|
|
147
237
|
|
148
238
|
private:
|
149
239
|
Base begin;
|
240
|
+
|
241
|
+
friend class quantiles_sorted_view<T, C, A>;
|
242
|
+
const_iterator(const Base& it, const Base& begin): Base(it), begin(begin) {}
|
150
243
|
};
|
151
244
|
|
152
245
|
} /* namespace datasketches */
|
@@ -75,7 +75,7 @@ double quantiles_sorted_view<T, C, A>::get_rank(const T& item, bool inclusive) c
|
|
75
75
|
template<typename T, typename C, typename A>
|
76
76
|
auto quantiles_sorted_view<T, C, A>::get_quantile(double rank, bool inclusive) const -> quantile_return_type {
|
77
77
|
if (entries_.empty()) throw std::runtime_error("operation is undefined for an empty sketch");
|
78
|
-
uint64_t weight = inclusive ? std::ceil(rank * total_weight_) : rank * total_weight_;
|
78
|
+
uint64_t weight = static_cast<uint64_t>(inclusive ? std::ceil(rank * total_weight_) : rank * total_weight_);
|
79
79
|
auto it = inclusive ?
|
80
80
|
std::lower_bound(entries_.begin(), entries_.end(), make_dummy_entry<T>(weight), compare_pairs_by_second())
|
81
81
|
: std::upper_bound(entries_.begin(), entries_.end(), make_dummy_entry<T>(weight), compare_pairs_by_second());
|