catboost 1.25.1 → 1.26.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (289) hide show
  1. package/DEPLOYMENT.md +22 -15
  2. package/README.md +37 -27
  3. package/binding.gyp +5 -7
  4. package/build_scripts/bootstrap.js +2 -1
  5. package/build_scripts/out/build.js +46 -68
  6. package/build_scripts/out/build_model.js +1 -1
  7. package/build_scripts/out/{build_ya.js → build_native.js} +1 -1
  8. package/build_scripts/out/ci.js +5 -5
  9. package/build_scripts/out/config.js +32 -18
  10. package/build_scripts/out/install.js +5 -3
  11. package/build_scripts/out/package_prepublish.js +1 -1
  12. package/build_scripts/out/packaging.js +1 -19
  13. package/build_scripts/out/run_tests.js +1 -1
  14. package/build_scripts/out/test.js +8 -3
  15. package/config.json +18 -11
  16. package/inc/catboost/libs/model_interface/c_api.h +349 -3
  17. package/lib/catboost.d.ts +65 -21
  18. package/package.json +4 -4
  19. package/src/api_helpers.cpp +100 -24
  20. package/src/api_helpers.h +8 -7
  21. package/src/api_module.cpp +1 -2
  22. package/src/model.cpp +483 -83
  23. package/src/model.h +24 -9
  24. package/inc/contrib/libs/cxxsupp/system_stl/include/stlfwd +0 -14
  25. package/inc/util/charset/recode_result.h +0 -9
  26. package/inc/util/charset/unicode_table.h +0 -123
  27. package/inc/util/charset/unidata.h +0 -421
  28. package/inc/util/charset/utf8.h +0 -384
  29. package/inc/util/charset/wide.h +0 -843
  30. package/inc/util/charset/wide_specific.h +0 -22
  31. package/inc/util/datetime/base.h +0 -669
  32. package/inc/util/datetime/constants.h +0 -7
  33. package/inc/util/datetime/cputimer.h +0 -124
  34. package/inc/util/datetime/parser.h +0 -292
  35. package/inc/util/datetime/systime.h +0 -47
  36. package/inc/util/datetime/uptime.h +0 -8
  37. package/inc/util/digest/city.h +0 -88
  38. package/inc/util/digest/fnv.h +0 -73
  39. package/inc/util/digest/multi.h +0 -14
  40. package/inc/util/digest/murmur.h +0 -57
  41. package/inc/util/digest/numeric.h +0 -86
  42. package/inc/util/digest/sequence.h +0 -48
  43. package/inc/util/draft/date.h +0 -129
  44. package/inc/util/draft/datetime.h +0 -184
  45. package/inc/util/draft/enum.h +0 -136
  46. package/inc/util/draft/holder_vector.h +0 -102
  47. package/inc/util/draft/ip.h +0 -131
  48. package/inc/util/draft/matrix.h +0 -108
  49. package/inc/util/draft/memory.h +0 -40
  50. package/inc/util/folder/dirent_win.h +0 -46
  51. package/inc/util/folder/dirut.h +0 -121
  52. package/inc/util/folder/filelist.h +0 -81
  53. package/inc/util/folder/fts.h +0 -108
  54. package/inc/util/folder/iterator.h +0 -109
  55. package/inc/util/folder/lstat_win.h +0 -20
  56. package/inc/util/folder/path.h +0 -225
  57. package/inc/util/folder/pathsplit.h +0 -113
  58. package/inc/util/folder/tempdir.h +0 -42
  59. package/inc/util/generic/adaptor.h +0 -134
  60. package/inc/util/generic/algorithm.h +0 -765
  61. package/inc/util/generic/array_ref.h +0 -282
  62. package/inc/util/generic/array_size.h +0 -24
  63. package/inc/util/generic/benchmark/vector_count_ctor/f.h +0 -9
  64. package/inc/util/generic/bitmap.h +0 -1115
  65. package/inc/util/generic/bitops.h +0 -459
  66. package/inc/util/generic/bt_exception.h +0 -24
  67. package/inc/util/generic/buffer.h +0 -232
  68. package/inc/util/generic/cast.h +0 -176
  69. package/inc/util/generic/deque.h +0 -24
  70. package/inc/util/generic/explicit_type.h +0 -42
  71. package/inc/util/generic/fastqueue.h +0 -55
  72. package/inc/util/generic/flags.h +0 -244
  73. package/inc/util/generic/function.h +0 -103
  74. package/inc/util/generic/fwd.h +0 -171
  75. package/inc/util/generic/guid.h +0 -61
  76. package/inc/util/generic/hash.h +0 -2032
  77. package/inc/util/generic/hash_primes.h +0 -140
  78. package/inc/util/generic/hash_set.h +0 -490
  79. package/inc/util/generic/hide_ptr.h +0 -3
  80. package/inc/util/generic/intrlist.h +0 -876
  81. package/inc/util/generic/is_in.h +0 -53
  82. package/inc/util/generic/iterator.h +0 -137
  83. package/inc/util/generic/iterator_range.h +0 -105
  84. package/inc/util/generic/lazy_value.h +0 -66
  85. package/inc/util/generic/list.h +0 -22
  86. package/inc/util/generic/map.h +0 -44
  87. package/inc/util/generic/mapfindptr.h +0 -60
  88. package/inc/util/generic/maybe.h +0 -713
  89. package/inc/util/generic/maybe_traits.h +0 -164
  90. package/inc/util/generic/mem_copy.h +0 -55
  91. package/inc/util/generic/noncopyable.h +0 -38
  92. package/inc/util/generic/object_counter.h +0 -53
  93. package/inc/util/generic/ptr.h +0 -1113
  94. package/inc/util/generic/queue.h +0 -57
  95. package/inc/util/generic/refcount.h +0 -162
  96. package/inc/util/generic/reserve.h +0 -11
  97. package/inc/util/generic/scope.h +0 -65
  98. package/inc/util/generic/serialized_enum.h +0 -406
  99. package/inc/util/generic/set.h +0 -42
  100. package/inc/util/generic/singleton.h +0 -136
  101. package/inc/util/generic/size_literals.h +0 -65
  102. package/inc/util/generic/stack.h +0 -18
  103. package/inc/util/generic/store_policy.h +0 -120
  104. package/inc/util/generic/strbase.h +0 -612
  105. package/inc/util/generic/strbuf.h +0 -552
  106. package/inc/util/generic/strfcpy.h +0 -17
  107. package/inc/util/generic/string.h +0 -1572
  108. package/inc/util/generic/string_hash.h +0 -21
  109. package/inc/util/generic/string_ut.h +0 -1175
  110. package/inc/util/generic/type_name.h +0 -34
  111. package/inc/util/generic/typelist.h +0 -114
  112. package/inc/util/generic/typetraits.h +0 -325
  113. package/inc/util/generic/utility.h +0 -132
  114. package/inc/util/generic/va_args.h +0 -400
  115. package/inc/util/generic/variant.h +0 -631
  116. package/inc/util/generic/variant_traits.h +0 -171
  117. package/inc/util/generic/vector.h +0 -119
  118. package/inc/util/generic/xrange.h +0 -258
  119. package/inc/util/generic/yexception.h +0 -212
  120. package/inc/util/generic/yexception_ut.h +0 -14
  121. package/inc/util/generic/ylimits.h +0 -92
  122. package/inc/util/generic/ymath.h +0 -206
  123. package/inc/util/memory/addstorage.h +0 -93
  124. package/inc/util/memory/alloc.h +0 -27
  125. package/inc/util/memory/blob.h +0 -296
  126. package/inc/util/memory/mmapalloc.h +0 -8
  127. package/inc/util/memory/pool.h +0 -432
  128. package/inc/util/memory/segmented_string_pool.h +0 -194
  129. package/inc/util/memory/segpool_alloc.h +0 -118
  130. package/inc/util/memory/smallobj.h +0 -141
  131. package/inc/util/memory/tempbuf.h +0 -111
  132. package/inc/util/network/address.h +0 -136
  133. package/inc/util/network/endpoint.h +0 -61
  134. package/inc/util/network/hostip.h +0 -16
  135. package/inc/util/network/init.h +0 -60
  136. package/inc/util/network/interface.h +0 -17
  137. package/inc/util/network/iovec.h +0 -65
  138. package/inc/util/network/ip.h +0 -116
  139. package/inc/util/network/nonblock.h +0 -8
  140. package/inc/util/network/pair.h +0 -9
  141. package/inc/util/network/poller.h +0 -58
  142. package/inc/util/network/pollerimpl.h +0 -707
  143. package/inc/util/network/sock.h +0 -608
  144. package/inc/util/network/socket.h +0 -421
  145. package/inc/util/random/common_ops.h +0 -130
  146. package/inc/util/random/easy.h +0 -47
  147. package/inc/util/random/entropy.h +0 -21
  148. package/inc/util/random/fast.h +0 -101
  149. package/inc/util/random/init_atfork.h +0 -3
  150. package/inc/util/random/lcg_engine.h +0 -66
  151. package/inc/util/random/mersenne.h +0 -46
  152. package/inc/util/random/mersenne32.h +0 -50
  153. package/inc/util/random/mersenne64.h +0 -50
  154. package/inc/util/random/normal.h +0 -38
  155. package/inc/util/random/random.h +0 -30
  156. package/inc/util/random/shuffle.h +0 -39
  157. package/inc/util/str_stl.h +0 -266
  158. package/inc/util/stream/aligned.h +0 -99
  159. package/inc/util/stream/buffer.h +0 -119
  160. package/inc/util/stream/buffered.h +0 -225
  161. package/inc/util/stream/debug.h +0 -53
  162. package/inc/util/stream/direct_io.h +0 -43
  163. package/inc/util/stream/file.h +0 -108
  164. package/inc/util/stream/format.h +0 -444
  165. package/inc/util/stream/fwd.h +0 -100
  166. package/inc/util/stream/hex.h +0 -8
  167. package/inc/util/stream/holder.h +0 -44
  168. package/inc/util/stream/input.h +0 -273
  169. package/inc/util/stream/labeled.h +0 -19
  170. package/inc/util/stream/length.h +0 -100
  171. package/inc/util/stream/mem.h +0 -255
  172. package/inc/util/stream/multi.h +0 -32
  173. package/inc/util/stream/null.h +0 -61
  174. package/inc/util/stream/output.h +0 -304
  175. package/inc/util/stream/pipe.h +0 -112
  176. package/inc/util/stream/printf.h +0 -25
  177. package/inc/util/stream/str.h +0 -207
  178. package/inc/util/stream/tee.h +0 -28
  179. package/inc/util/stream/tempbuf.h +0 -21
  180. package/inc/util/stream/tokenizer.h +0 -214
  181. package/inc/util/stream/trace.h +0 -60
  182. package/inc/util/stream/walk.h +0 -35
  183. package/inc/util/stream/zerocopy.h +0 -91
  184. package/inc/util/stream/zerocopy_output.h +0 -57
  185. package/inc/util/stream/zlib.h +0 -173
  186. package/inc/util/string/ascii.h +0 -236
  187. package/inc/util/string/builder.h +0 -39
  188. package/inc/util/string/cast.h +0 -347
  189. package/inc/util/string/cstriter.h +0 -14
  190. package/inc/util/string/escape.h +0 -70
  191. package/inc/util/string/hex.h +0 -59
  192. package/inc/util/string/join.h +0 -194
  193. package/inc/util/string/printf.h +0 -13
  194. package/inc/util/string/reverse.h +0 -16
  195. package/inc/util/string/split.h +0 -1080
  196. package/inc/util/string/strip.h +0 -257
  197. package/inc/util/string/strspn.h +0 -65
  198. package/inc/util/string/subst.h +0 -56
  199. package/inc/util/string/type.h +0 -50
  200. package/inc/util/string/util.h +0 -195
  201. package/inc/util/string/vector.h +0 -132
  202. package/inc/util/system/align.h +0 -50
  203. package/inc/util/system/atexit.h +0 -22
  204. package/inc/util/system/atomic.h +0 -51
  205. package/inc/util/system/atomic_gcc.h +0 -90
  206. package/inc/util/system/atomic_ops.h +0 -189
  207. package/inc/util/system/atomic_win.h +0 -114
  208. package/inc/util/system/backtrace.h +0 -39
  209. package/inc/util/system/byteorder.h +0 -186
  210. package/inc/util/system/compat.h +0 -84
  211. package/inc/util/system/compiler.h +0 -620
  212. package/inc/util/system/condvar.h +0 -71
  213. package/inc/util/system/context.h +0 -181
  214. package/inc/util/system/context_aarch64.h +0 -8
  215. package/inc/util/system/context_i686.h +0 -9
  216. package/inc/util/system/context_x86.h +0 -12
  217. package/inc/util/system/context_x86_64.h +0 -7
  218. package/inc/util/system/cpu_id.h +0 -159
  219. package/inc/util/system/daemon.h +0 -28
  220. package/inc/util/system/datetime.h +0 -98
  221. package/inc/util/system/defaults.h +0 -149
  222. package/inc/util/system/demangle.h +0 -5
  223. package/inc/util/system/demangle_impl.h +0 -23
  224. package/inc/util/system/direct_io.h +0 -71
  225. package/inc/util/system/dynlib.h +0 -119
  226. package/inc/util/system/env.h +0 -32
  227. package/inc/util/system/error.h +0 -95
  228. package/inc/util/system/event.h +0 -122
  229. package/inc/util/system/execpath.h +0 -17
  230. package/inc/util/system/fasttime.h +0 -6
  231. package/inc/util/system/fhandle.h +0 -27
  232. package/inc/util/system/file.h +0 -210
  233. package/inc/util/system/file_lock.h +0 -34
  234. package/inc/util/system/filemap.h +0 -383
  235. package/inc/util/system/flock.h +0 -35
  236. package/inc/util/system/fs.h +0 -156
  237. package/inc/util/system/fs_win.h +0 -29
  238. package/inc/util/system/fstat.h +0 -46
  239. package/inc/util/system/getpid.h +0 -12
  240. package/inc/util/system/guard.h +0 -179
  241. package/inc/util/system/hi_lo.h +0 -139
  242. package/inc/util/system/hostname.h +0 -10
  243. package/inc/util/system/hp_timer.h +0 -36
  244. package/inc/util/system/info.h +0 -12
  245. package/inc/util/system/interrupt_signals.h +0 -22
  246. package/inc/util/system/madvise.h +0 -30
  247. package/inc/util/system/maxlen.h +0 -32
  248. package/inc/util/system/mem_info.h +0 -18
  249. package/inc/util/system/mincore.h +0 -38
  250. package/inc/util/system/mktemp.h +0 -11
  251. package/inc/util/system/mlock.h +0 -43
  252. package/inc/util/system/mutex.h +0 -67
  253. package/inc/util/system/nice.h +0 -3
  254. package/inc/util/system/pipe.h +0 -90
  255. package/inc/util/system/platform.h +0 -246
  256. package/inc/util/system/progname.h +0 -13
  257. package/inc/util/system/protect.h +0 -25
  258. package/inc/util/system/rusage.h +0 -26
  259. package/inc/util/system/rwlock.h +0 -78
  260. package/inc/util/system/sanitizers.h +0 -122
  261. package/inc/util/system/sem.h +0 -41
  262. package/inc/util/system/shellcommand.h +0 -472
  263. package/inc/util/system/shmat.h +0 -32
  264. package/inc/util/system/sigset.h +0 -78
  265. package/inc/util/system/spin_wait.h +0 -10
  266. package/inc/util/system/spinlock.h +0 -121
  267. package/inc/util/system/src_location.h +0 -25
  268. package/inc/util/system/src_root.h +0 -68
  269. package/inc/util/system/sys_alloc.h +0 -43
  270. package/inc/util/system/sysstat.h +0 -52
  271. package/inc/util/system/tempfile.h +0 -34
  272. package/inc/util/system/thread.h +0 -167
  273. package/inc/util/system/tls.h +0 -307
  274. package/inc/util/system/types.h +0 -119
  275. package/inc/util/system/unaligned_mem.h +0 -67
  276. package/inc/util/system/user.h +0 -5
  277. package/inc/util/system/utime.h +0 -6
  278. package/inc/util/system/valgrind.h +0 -48
  279. package/inc/util/system/winint.h +0 -43
  280. package/inc/util/system/yassert.h +0 -121
  281. package/inc/util/system/yield.h +0 -4
  282. package/inc/util/thread/factory.h +0 -65
  283. package/inc/util/thread/fwd.h +0 -30
  284. package/inc/util/thread/lfqueue.h +0 -406
  285. package/inc/util/thread/lfstack.h +0 -188
  286. package/inc/util/thread/pool.h +0 -388
  287. package/inc/util/thread/singleton.h +0 -42
  288. package/inc/util/ysafeptr.h +0 -427
  289. package/inc/util/ysaveload.h +0 -700
@@ -1,552 +0,0 @@
1
- #pragma once
2
-
3
- #include "fwd.h"
4
- #include "strbase.h"
5
- #include "utility.h"
6
- #include "typetraits.h"
7
-
8
- #include <string_view>
9
-
10
- template <typename TCharType, typename TTraits>
11
- class TBasicStringBuf:
12
- public std::basic_string_view<TCharType>,
13
- public TStringBase<TBasicStringBuf<TCharType, TTraits>, TCharType, TTraits>
14
- {
15
- private:
16
- using TdSelf = TBasicStringBuf;
17
- using TBase = TStringBase<TdSelf, TCharType, TTraits>;
18
- using TStringView = std::basic_string_view<TCharType>;
19
-
20
- public:
21
- using char_type = TCharType; // TODO: DROP
22
- using traits_type = TTraits;
23
-
24
- //Resolving some ambiguity between TStringBase and std::basic_string_view
25
- //for typenames
26
- using typename TStringView::size_type;
27
- using typename TStringView::value_type;
28
- using typename TStringView::iterator;
29
- using typename TStringView::const_iterator;
30
- using typename TStringView::reverse_iterator;
31
- using typename TStringView::const_reverse_iterator;
32
- using typename TStringView::reference;
33
- using typename TStringView::const_reference;
34
-
35
- //for constants
36
- using TStringView::npos;
37
-
38
- //for methods and operators
39
- using TStringView::begin;
40
- using TStringView::end;
41
- using TStringView::cbegin;
42
- using TStringView::cend;
43
- using TStringView::rbegin;
44
- using TStringView::rend;
45
- using TStringView::crbegin;
46
- using TStringView::crend;
47
-
48
- using TStringView::size;
49
- using TStringView::empty;
50
- using TStringView::data;
51
-
52
- using TStringView::operator[];
53
-
54
- /*
55
- * WARN:
56
- TBase::at silently returns 0 in case of range error,
57
- * while std::string_view throws std::out_of_range.
58
- */
59
- using TBase::at;
60
- using TStringView::front;
61
- using TStringView::back;
62
-
63
- using TStringView::find;
64
- /*
65
- * WARN:
66
- * TBase::*find* methods take into account TCharTraits,
67
- while TStringView::*find* would use default std::char_traits.
68
- */
69
- using TBase::rfind;
70
- using TBase::find_first_of;
71
- using TBase::find_first_not_of;
72
- using TBase::find_last_of;
73
- using TBase::find_last_not_of;
74
-
75
- using TStringView::copy;
76
- /*
77
- * WARN:
78
- * TBase::compare takes into account TCharTraits,
79
- * thus making it possible to implement case-insensitive string buffers,
80
- * if it is using TStringBase::compare
81
- */
82
- using TBase::compare;
83
-
84
- /*
85
- * WARN:
86
- * TBase::substr properly checks boundary cases and clamps them with maximum valid values,
87
- * while TStringView::substr throws std::out_of_range error.
88
- */
89
- using TBase::substr;
90
-
91
- /*
92
- * WARN:
93
- * Constructing std::string_view(nullptr, non_zero_size) ctor
94
- * results in undefined behavior according to the standard.
95
- * In libc++ this UB results in runtime assertion, though it is better
96
- * to generate compilation error instead.
97
- */
98
- constexpr inline TBasicStringBuf(std::nullptr_t begin, size_t size) = delete;
99
-
100
- constexpr inline TBasicStringBuf(const TCharType* data, size_t size) noexcept
101
- : TStringView(data, size)
102
- {
103
- }
104
-
105
- _LIBCPP_CONSTEXPR_AFTER_CXX14
106
- inline TBasicStringBuf(const TCharType* data) noexcept
107
- /*
108
- * WARN: TBase::StrLen properly handles nullptr,
109
- * while std::string_view (using std::char_traits) will abort in such case
110
- */
111
- : TStringView(data, TBase::StrLen(data))
112
- {
113
- }
114
-
115
- constexpr inline TBasicStringBuf(const TCharType* beg, const TCharType* end) noexcept
116
- : TStringView(beg, end - beg)
117
- {
118
- }
119
-
120
- template <typename D, typename T>
121
- inline TBasicStringBuf(const TStringBase<D, TCharType, T>& str) noexcept
122
- : TStringView(str.data(), str.size())
123
- {
124
- }
125
-
126
- template <typename T, typename A>
127
- inline TBasicStringBuf(const std::basic_string<TCharType, T, A>& str) noexcept
128
- : TStringView(str)
129
- {
130
- }
131
-
132
- template <typename TCharTraits>
133
- constexpr TBasicStringBuf(std::basic_string_view<TCharType, TCharTraits> view) noexcept
134
- : TStringView(view)
135
- {
136
- }
137
-
138
- constexpr inline TBasicStringBuf() noexcept
139
- {
140
- /*
141
- * WARN:
142
- * This ctor can not be defaulted due to the following feature of default initialization:
143
- * If T is a const-qualified type, it must be a class type with a user-provided default constructor.
144
- * (see https://en.cppreference.com/w/cpp/language/default_initialization).
145
- *
146
- * This means, that a class with default ctor can not be a constant member of another class with default ctor.
147
- */
148
- }
149
-
150
- inline TBasicStringBuf(const TBasicStringBuf& src, size_t pos, size_t n) noexcept
151
- : TBasicStringBuf(src)
152
- {
153
- Skip(pos).Trunc(n);
154
- }
155
-
156
- inline TBasicStringBuf(const TBasicStringBuf& src, size_t pos) noexcept
157
- : TBasicStringBuf(src, pos, TBase::npos)
158
- {
159
- }
160
-
161
- Y_PURE_FUNCTION
162
- inline TBasicStringBuf SubString(size_t pos, size_t n) const noexcept {
163
- pos = Min(pos, size());
164
- n = Min(n, size() - pos);
165
- return TBasicStringBuf(data() + pos, n);
166
- }
167
-
168
- public:
169
- void Clear() {
170
- *this = TdSelf();
171
- }
172
-
173
- constexpr bool IsInited() const noexcept {
174
- return data() != nullptr;
175
- }
176
-
177
- public:
178
- /**
179
- * Tries to split string in two parts using given delimiter character.
180
- * Searches for the delimiter, scanning string from the beginning.
181
- * The delimiter is excluded from the result. Both out parameters are
182
- * left unmodified if there was no delimiter character in string.
183
- *
184
- * @param[in] delim Delimiter character.
185
- * @param[out] l The first part of split result.
186
- * @param[out] r The second part of split result.
187
- * @returns Whether the split was actually performed.
188
- */
189
- inline bool TrySplit(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
190
- return TrySplitOn(TBase::find(delim), l, r);
191
- }
192
-
193
- /**
194
- * Tries to split string in two parts using given delimiter character.
195
- * Searches for the delimiter, scanning string from the end.
196
- * The delimiter is excluded from the result. Both out parameters are
197
- * left unmodified if there was no delimiter character in string.
198
- *
199
- * @param[in] delim Delimiter character.
200
- * @param[out] l The first part of split result.
201
- * @param[out] r The second part of split result.
202
- * @returns Whether the split was actually performed.
203
- */
204
- inline bool TryRSplit(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
205
- return TrySplitOn(TBase::rfind(delim), l, r);
206
- }
207
-
208
- /**
209
- * Tries to split string in two parts using given delimiter sequence.
210
- * Searches for the delimiter, scanning string from the beginning.
211
- * The delimiter sequence is excluded from the result. Both out parameters
212
- are left unmodified if there was no delimiter sequence in string.
213
- *
214
- * @param[in] delim Delimiter sequence.
215
- * @param[out] l The first part of split result.
216
- * @param[out] r The second part of split result.
217
- * @returns Whether the split was actually performed.
218
- */
219
- inline bool TrySplit(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
220
- return TrySplitOn(TBase::find(delim), l, r, delim.size());
221
- }
222
-
223
- /**
224
- * Tries to split string in two parts using given delimiter sequence.
225
- * Searches for the delimiter, scanning string from the end.
226
- * The delimiter sequence is excluded from the result. Both out parameters
227
- are left unmodified if there was no delimiter sequence in string.
228
- *
229
- * @param[in] delim Delimiter sequence.
230
- * @param[out] l The first part of split result.
231
- * @param[out] r The second part of split result.
232
- * @returns Whether the split was actually performed.
233
- */
234
- inline bool TryRSplit(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
235
- return TrySplitOn(TBase::rfind(delim), l, r, delim.size());
236
- }
237
-
238
- inline void Split(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
239
- SplitTemplate(delim, l, r);
240
- }
241
-
242
- inline void RSplit(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
243
- RSplitTemplate(delim, l, r);
244
- }
245
-
246
- inline void Split(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
247
- SplitTemplate(delim, l, r);
248
- }
249
-
250
- inline void RSplit(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
251
- RSplitTemplate(delim, l, r);
252
- }
253
-
254
- private:
255
- // splits on a delimiter at a given position; delimiter is excluded
256
- void DoSplitOn(size_t pos, TdSelf& l, TdSelf& r, size_t len) const noexcept {
257
- Y_ASSERT(pos != TBase::npos);
258
-
259
- // make a copy in case one of l/r is really *this
260
- const TdSelf tok = SubStr(pos + len);
261
- l = Head(pos);
262
- r = tok;
263
- }
264
-
265
- public:
266
- // In all methods below with @pos parameter, @pos is supposed to be
267
- // a result of string find()/rfind()/find_first() or other similar functions,
268
- // returning either position within string length [0..size()) or npos.
269
- // For all other @pos values (out of string index range) the behaviour isn't well defined
270
- // For example, for TStringBuf s("abc"):
271
- // s.TrySplitOn(s.find('z'), ...) is false, but s.TrySplitOn(100500, ...) is true.
272
-
273
- bool TrySplitOn(size_t pos, TdSelf& l, TdSelf& r, size_t len = 1) const noexcept {
274
- if (TBase::npos == pos)
275
- return false;
276
-
277
- DoSplitOn(pos, l, r, len);
278
- return true;
279
- }
280
-
281
- void SplitOn(size_t pos, TdSelf& l, TdSelf& r, size_t len = 1) const noexcept {
282
- if (!TrySplitOn(pos, l, r, len)) {
283
- l = *this;
284
- r = TdSelf();
285
- }
286
- }
287
-
288
- bool TrySplitAt(size_t pos, TdSelf& l, TdSelf& r) const noexcept {
289
- return TrySplitOn(pos, l, r, 0);
290
- }
291
-
292
- void SplitAt(size_t pos, TdSelf& l, TdSelf& r) const noexcept {
293
- SplitOn(pos, l, r, 0);
294
- }
295
-
296
- /*
297
- // Not implemented intentionally, use TrySplitOn() instead
298
- void RSplitOn(size_t pos, TdSelf& l, TdSelf& r) const noexcept;
299
- void RSplitAt(size_t pos, TdSelf& l, TdSelf& r) const noexcept;
300
- */
301
-
302
- public:
303
- Y_PURE_FUNCTION
304
- inline TdSelf After(TCharType c) const noexcept {
305
- TdSelf l, r;
306
- return TrySplit(c, l, r) ? r : *this;
307
- }
308
-
309
- Y_PURE_FUNCTION
310
- inline TdSelf Before(TCharType c) const noexcept {
311
- TdSelf l, r;
312
- return TrySplit(c, l, r) ? l : *this;
313
- }
314
-
315
- Y_PURE_FUNCTION
316
- inline TdSelf RAfter(TCharType c) const noexcept {
317
- TdSelf l, r;
318
- return TryRSplit(c, l, r) ? r : *this;
319
- }
320
-
321
- Y_PURE_FUNCTION
322
- inline TdSelf RBefore(TCharType c) const noexcept {
323
- TdSelf l, r;
324
- return TryRSplit(c, l, r) ? l : *this;
325
- }
326
-
327
- public:
328
- inline bool AfterPrefix(const TdSelf& prefix, TdSelf& result) const noexcept {
329
- if (this->StartsWith(prefix)) {
330
- result = Tail(prefix.size());
331
- return true;
332
- }
333
- return false;
334
- }
335
-
336
- inline bool BeforeSuffix(const TdSelf& suffix, TdSelf& result) const noexcept {
337
- if (this->EndsWith(suffix)) {
338
- result = Head(size() - suffix.size());
339
- return true;
340
- }
341
- return false;
342
- }
343
-
344
- // returns true if string started with `prefix`, false otherwise
345
- inline bool SkipPrefix(const TdSelf& prefix) noexcept {
346
- return AfterPrefix(prefix, *this);
347
- }
348
-
349
- // returns true if string ended with `suffix`, false otherwise
350
- inline bool ChopSuffix(const TdSelf& suffix) noexcept {
351
- return BeforeSuffix(suffix, *this);
352
- }
353
-
354
- public:
355
- // returns tail, including pos
356
- TdSelf SplitOffAt(size_t pos) {
357
- const TdSelf tok = SubStr(pos);
358
- Trunc(pos);
359
- return tok;
360
- }
361
-
362
- // returns head, tail includes pos
363
- TdSelf NextTokAt(size_t pos) {
364
- const TdSelf tok = Head(pos);
365
- Skip(pos);
366
- return tok;
367
- }
368
-
369
- TdSelf SplitOffOn(size_t pos) {
370
- TdSelf tok;
371
- SplitOn(pos, *this, tok);
372
- return tok;
373
- }
374
-
375
- TdSelf NextTokOn(size_t pos) {
376
- TdSelf tok;
377
- SplitOn(pos, tok, *this);
378
- return tok;
379
- }
380
- /*
381
- // See comment on RSplitOn() above
382
- TdSelf RSplitOffOn(size_t pos);
383
- TdSelf RNextTokOn(size_t pos);
384
- */
385
-
386
- public:
387
- TdSelf SplitOff(TCharType delim) {
388
- TdSelf tok;
389
- Split(delim, *this, tok);
390
- return tok;
391
- }
392
-
393
- TdSelf RSplitOff(TCharType delim) {
394
- TdSelf tok;
395
- RSplit(delim, tok, *this);
396
- return tok;
397
- }
398
-
399
- bool NextTok(TCharType delim, TdSelf& tok) {
400
- return NextTokTemplate(delim, tok);
401
- }
402
-
403
- bool NextTok(TdSelf delim, TdSelf& tok) {
404
- return NextTokTemplate(delim, tok);
405
- }
406
-
407
- bool RNextTok(TCharType delim, TdSelf& tok) {
408
- return RNextTokTemplate(delim, tok);
409
- }
410
-
411
- bool RNextTok(TdSelf delim, TdSelf& tok) {
412
- return RNextTokTemplate(delim, tok);
413
- }
414
-
415
- bool ReadLine(TdSelf& tok) {
416
- if (NextTok('\n', tok)) {
417
- while (!tok.empty() && tok.back() == '\r') {
418
- tok.remove_suffix(1);
419
- }
420
-
421
- return true;
422
- }
423
-
424
- return false;
425
- }
426
-
427
- TdSelf NextTok(TCharType delim) {
428
- return NextTokTemplate(delim);
429
- }
430
-
431
- TdSelf RNextTok(TCharType delim) {
432
- return RNextTokTemplate(delim);
433
- }
434
-
435
- TdSelf NextTok(TdSelf delim) {
436
- return NextTokTemplate(delim);
437
- }
438
-
439
- TdSelf RNextTok(TdSelf delim) {
440
- return RNextTokTemplate(delim);
441
- }
442
-
443
- public: // string subsequences
444
- /// Cut last @c shift characters (or less if length is less than @c shift)
445
- inline TdSelf& Chop(size_t shift) noexcept {
446
- this->remove_suffix(std::min(shift, size()));
447
- return *this;
448
- }
449
-
450
- /// Cut first @c shift characters (or less if length is less than @c shift)
451
- inline TdSelf& Skip(size_t shift) noexcept {
452
- this->remove_prefix(std::min(shift, size()));
453
- return *this;
454
- }
455
-
456
- /// Sets the start pointer to a position relative to the end
457
- inline TdSelf& RSeek(size_t tailSize) noexcept {
458
- if (size() > tailSize) {
459
- //WARN: removing TStringView:: will lead to an infinite recursion
460
- *this = TStringView::substr(size() - tailSize, tailSize);
461
- }
462
-
463
- return *this;
464
- }
465
-
466
- inline TdSelf& Trunc(size_t targetSize) noexcept {
467
- //WARN: removing TStringView:: will lead to an infinite recursion
468
- *this = TStringView::substr(0, targetSize);
469
- return *this;
470
- }
471
-
472
- Y_PURE_FUNCTION
473
- inline TdSelf SubStr(size_t beg) const noexcept {
474
- return TdSelf(*this).Skip(beg);
475
- }
476
-
477
- Y_PURE_FUNCTION
478
- inline TdSelf SubStr(size_t beg, size_t len) const noexcept {
479
- return SubStr(beg).Trunc(len);
480
- }
481
-
482
- Y_PURE_FUNCTION
483
- inline TdSelf Head(size_t pos) const noexcept {
484
- return TdSelf(*this).Trunc(pos);
485
- }
486
-
487
- Y_PURE_FUNCTION
488
- inline TdSelf Tail(size_t pos) const noexcept {
489
- return SubStr(pos);
490
- }
491
-
492
- Y_PURE_FUNCTION
493
- inline TdSelf Last(size_t len) const noexcept {
494
- return TdSelf(*this).RSeek(len);
495
- }
496
-
497
- private:
498
- template <typename TDelimiterType>
499
- TdSelf NextTokTemplate(TDelimiterType delim) {
500
- TdSelf tok;
501
- Split(delim, tok, *this);
502
- return tok;
503
- }
504
-
505
- template <typename TDelimiterType>
506
- TdSelf RNextTokTemplate(TDelimiterType delim) {
507
- TdSelf tok;
508
- RSplit(delim, *this, tok);
509
- return tok;
510
- }
511
-
512
- template <typename TDelimiterType>
513
- bool NextTokTemplate(TDelimiterType delim, TdSelf& tok) {
514
- if (!empty()) {
515
- tok = NextTokTemplate(delim);
516
- return true;
517
- }
518
- return false;
519
- }
520
-
521
- template <typename TDelimiterType>
522
- bool RNextTokTemplate(TDelimiterType delim, TdSelf& tok) {
523
- if (!empty()) {
524
- tok = RNextTokTemplate(delim);
525
- return true;
526
- }
527
- return false;
528
- }
529
-
530
- template <typename TDelimiterType>
531
- inline void SplitTemplate(TDelimiterType delim, TdSelf& l, TdSelf& r) const noexcept {
532
- if (!TrySplit(delim, l, r)) {
533
- l = *this;
534
- r = TdSelf();
535
- }
536
- }
537
-
538
- template <typename TDelimiterType>
539
- inline void RSplitTemplate(TDelimiterType delim, TdSelf& l, TdSelf& r) const noexcept {
540
- if (!TryRSplit(delim, l, r)) {
541
- r = *this;
542
- l = TdSelf();
543
- }
544
- }
545
- };
546
-
547
- std::ostream& operator<< (std::ostream& os, TStringBuf buf);
548
-
549
- template <typename TCharType, size_t size>
550
- constexpr inline TBasicStringBuf<TCharType> AsStringBuf(const TCharType (&str)[size]) noexcept {
551
- return TBasicStringBuf<TCharType>(str, size - 1);
552
- }
@@ -1,17 +0,0 @@
1
- #pragma once
2
-
3
- /*
4
- * strfcpy is a faster version of strlcpy().
5
- It returns void and thus does not waste time computing
6
- * (most likely, unneeded) strlen(str)
7
- *
8
- * Comparison with other copying functions:
9
- * strcpy() - buffer overflow ready
10
- * strncpy() - wastes time filling exactly n bytes with 0
11
- * strlcpy() - wastes time searching for the length of src
12
- * memcpy() - wastes time copying exactly n bytes even if the string is shorter
13
- */
14
-
15
- #include <stddef.h>
16
-
17
- void strfcpy(char* dst, const char* src, size_t n);