catboost 1.25.1 → 1.27.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (290) hide show
  1. package/DEPLOYMENT.md +22 -15
  2. package/README.md +43 -27
  3. package/binding.gyp +5 -7
  4. package/build_scripts/bootstrap.js +2 -1
  5. package/build_scripts/out/build.js +46 -68
  6. package/build_scripts/out/build_model.js +1 -1
  7. package/build_scripts/out/{build_ya.js → build_native.js} +1 -1
  8. package/build_scripts/out/ci.js +5 -5
  9. package/build_scripts/out/common.js +1 -1
  10. package/build_scripts/out/config.js +32 -18
  11. package/build_scripts/out/install.js +5 -3
  12. package/build_scripts/out/package_prepublish.js +1 -1
  13. package/build_scripts/out/packaging.js +1 -19
  14. package/build_scripts/out/run_tests.js +1 -1
  15. package/build_scripts/out/test.js +8 -3
  16. package/config.json +18 -11
  17. package/inc/catboost/libs/model_interface/c_api.h +367 -5
  18. package/lib/catboost.d.ts +65 -21
  19. package/package.json +4 -4
  20. package/src/api_helpers.cpp +100 -24
  21. package/src/api_helpers.h +8 -7
  22. package/src/api_module.cpp +1 -2
  23. package/src/model.cpp +483 -83
  24. package/src/model.h +24 -9
  25. package/inc/contrib/libs/cxxsupp/system_stl/include/stlfwd +0 -14
  26. package/inc/util/charset/recode_result.h +0 -9
  27. package/inc/util/charset/unicode_table.h +0 -123
  28. package/inc/util/charset/unidata.h +0 -421
  29. package/inc/util/charset/utf8.h +0 -384
  30. package/inc/util/charset/wide.h +0 -843
  31. package/inc/util/charset/wide_specific.h +0 -22
  32. package/inc/util/datetime/base.h +0 -669
  33. package/inc/util/datetime/constants.h +0 -7
  34. package/inc/util/datetime/cputimer.h +0 -124
  35. package/inc/util/datetime/parser.h +0 -292
  36. package/inc/util/datetime/systime.h +0 -47
  37. package/inc/util/datetime/uptime.h +0 -8
  38. package/inc/util/digest/city.h +0 -88
  39. package/inc/util/digest/fnv.h +0 -73
  40. package/inc/util/digest/multi.h +0 -14
  41. package/inc/util/digest/murmur.h +0 -57
  42. package/inc/util/digest/numeric.h +0 -86
  43. package/inc/util/digest/sequence.h +0 -48
  44. package/inc/util/draft/date.h +0 -129
  45. package/inc/util/draft/datetime.h +0 -184
  46. package/inc/util/draft/enum.h +0 -136
  47. package/inc/util/draft/holder_vector.h +0 -102
  48. package/inc/util/draft/ip.h +0 -131
  49. package/inc/util/draft/matrix.h +0 -108
  50. package/inc/util/draft/memory.h +0 -40
  51. package/inc/util/folder/dirent_win.h +0 -46
  52. package/inc/util/folder/dirut.h +0 -121
  53. package/inc/util/folder/filelist.h +0 -81
  54. package/inc/util/folder/fts.h +0 -108
  55. package/inc/util/folder/iterator.h +0 -109
  56. package/inc/util/folder/lstat_win.h +0 -20
  57. package/inc/util/folder/path.h +0 -225
  58. package/inc/util/folder/pathsplit.h +0 -113
  59. package/inc/util/folder/tempdir.h +0 -42
  60. package/inc/util/generic/adaptor.h +0 -134
  61. package/inc/util/generic/algorithm.h +0 -765
  62. package/inc/util/generic/array_ref.h +0 -282
  63. package/inc/util/generic/array_size.h +0 -24
  64. package/inc/util/generic/benchmark/vector_count_ctor/f.h +0 -9
  65. package/inc/util/generic/bitmap.h +0 -1115
  66. package/inc/util/generic/bitops.h +0 -459
  67. package/inc/util/generic/bt_exception.h +0 -24
  68. package/inc/util/generic/buffer.h +0 -232
  69. package/inc/util/generic/cast.h +0 -176
  70. package/inc/util/generic/deque.h +0 -24
  71. package/inc/util/generic/explicit_type.h +0 -42
  72. package/inc/util/generic/fastqueue.h +0 -55
  73. package/inc/util/generic/flags.h +0 -244
  74. package/inc/util/generic/function.h +0 -103
  75. package/inc/util/generic/fwd.h +0 -171
  76. package/inc/util/generic/guid.h +0 -61
  77. package/inc/util/generic/hash.h +0 -2032
  78. package/inc/util/generic/hash_primes.h +0 -140
  79. package/inc/util/generic/hash_set.h +0 -490
  80. package/inc/util/generic/hide_ptr.h +0 -3
  81. package/inc/util/generic/intrlist.h +0 -876
  82. package/inc/util/generic/is_in.h +0 -53
  83. package/inc/util/generic/iterator.h +0 -137
  84. package/inc/util/generic/iterator_range.h +0 -105
  85. package/inc/util/generic/lazy_value.h +0 -66
  86. package/inc/util/generic/list.h +0 -22
  87. package/inc/util/generic/map.h +0 -44
  88. package/inc/util/generic/mapfindptr.h +0 -60
  89. package/inc/util/generic/maybe.h +0 -713
  90. package/inc/util/generic/maybe_traits.h +0 -164
  91. package/inc/util/generic/mem_copy.h +0 -55
  92. package/inc/util/generic/noncopyable.h +0 -38
  93. package/inc/util/generic/object_counter.h +0 -53
  94. package/inc/util/generic/ptr.h +0 -1113
  95. package/inc/util/generic/queue.h +0 -57
  96. package/inc/util/generic/refcount.h +0 -162
  97. package/inc/util/generic/reserve.h +0 -11
  98. package/inc/util/generic/scope.h +0 -65
  99. package/inc/util/generic/serialized_enum.h +0 -406
  100. package/inc/util/generic/set.h +0 -42
  101. package/inc/util/generic/singleton.h +0 -136
  102. package/inc/util/generic/size_literals.h +0 -65
  103. package/inc/util/generic/stack.h +0 -18
  104. package/inc/util/generic/store_policy.h +0 -120
  105. package/inc/util/generic/strbase.h +0 -612
  106. package/inc/util/generic/strbuf.h +0 -552
  107. package/inc/util/generic/strfcpy.h +0 -17
  108. package/inc/util/generic/string.h +0 -1572
  109. package/inc/util/generic/string_hash.h +0 -21
  110. package/inc/util/generic/string_ut.h +0 -1175
  111. package/inc/util/generic/type_name.h +0 -34
  112. package/inc/util/generic/typelist.h +0 -114
  113. package/inc/util/generic/typetraits.h +0 -325
  114. package/inc/util/generic/utility.h +0 -132
  115. package/inc/util/generic/va_args.h +0 -400
  116. package/inc/util/generic/variant.h +0 -631
  117. package/inc/util/generic/variant_traits.h +0 -171
  118. package/inc/util/generic/vector.h +0 -119
  119. package/inc/util/generic/xrange.h +0 -258
  120. package/inc/util/generic/yexception.h +0 -212
  121. package/inc/util/generic/yexception_ut.h +0 -14
  122. package/inc/util/generic/ylimits.h +0 -92
  123. package/inc/util/generic/ymath.h +0 -206
  124. package/inc/util/memory/addstorage.h +0 -93
  125. package/inc/util/memory/alloc.h +0 -27
  126. package/inc/util/memory/blob.h +0 -296
  127. package/inc/util/memory/mmapalloc.h +0 -8
  128. package/inc/util/memory/pool.h +0 -432
  129. package/inc/util/memory/segmented_string_pool.h +0 -194
  130. package/inc/util/memory/segpool_alloc.h +0 -118
  131. package/inc/util/memory/smallobj.h +0 -141
  132. package/inc/util/memory/tempbuf.h +0 -111
  133. package/inc/util/network/address.h +0 -136
  134. package/inc/util/network/endpoint.h +0 -61
  135. package/inc/util/network/hostip.h +0 -16
  136. package/inc/util/network/init.h +0 -60
  137. package/inc/util/network/interface.h +0 -17
  138. package/inc/util/network/iovec.h +0 -65
  139. package/inc/util/network/ip.h +0 -116
  140. package/inc/util/network/nonblock.h +0 -8
  141. package/inc/util/network/pair.h +0 -9
  142. package/inc/util/network/poller.h +0 -58
  143. package/inc/util/network/pollerimpl.h +0 -707
  144. package/inc/util/network/sock.h +0 -608
  145. package/inc/util/network/socket.h +0 -421
  146. package/inc/util/random/common_ops.h +0 -130
  147. package/inc/util/random/easy.h +0 -47
  148. package/inc/util/random/entropy.h +0 -21
  149. package/inc/util/random/fast.h +0 -101
  150. package/inc/util/random/init_atfork.h +0 -3
  151. package/inc/util/random/lcg_engine.h +0 -66
  152. package/inc/util/random/mersenne.h +0 -46
  153. package/inc/util/random/mersenne32.h +0 -50
  154. package/inc/util/random/mersenne64.h +0 -50
  155. package/inc/util/random/normal.h +0 -38
  156. package/inc/util/random/random.h +0 -30
  157. package/inc/util/random/shuffle.h +0 -39
  158. package/inc/util/str_stl.h +0 -266
  159. package/inc/util/stream/aligned.h +0 -99
  160. package/inc/util/stream/buffer.h +0 -119
  161. package/inc/util/stream/buffered.h +0 -225
  162. package/inc/util/stream/debug.h +0 -53
  163. package/inc/util/stream/direct_io.h +0 -43
  164. package/inc/util/stream/file.h +0 -108
  165. package/inc/util/stream/format.h +0 -444
  166. package/inc/util/stream/fwd.h +0 -100
  167. package/inc/util/stream/hex.h +0 -8
  168. package/inc/util/stream/holder.h +0 -44
  169. package/inc/util/stream/input.h +0 -273
  170. package/inc/util/stream/labeled.h +0 -19
  171. package/inc/util/stream/length.h +0 -100
  172. package/inc/util/stream/mem.h +0 -255
  173. package/inc/util/stream/multi.h +0 -32
  174. package/inc/util/stream/null.h +0 -61
  175. package/inc/util/stream/output.h +0 -304
  176. package/inc/util/stream/pipe.h +0 -112
  177. package/inc/util/stream/printf.h +0 -25
  178. package/inc/util/stream/str.h +0 -207
  179. package/inc/util/stream/tee.h +0 -28
  180. package/inc/util/stream/tempbuf.h +0 -21
  181. package/inc/util/stream/tokenizer.h +0 -214
  182. package/inc/util/stream/trace.h +0 -60
  183. package/inc/util/stream/walk.h +0 -35
  184. package/inc/util/stream/zerocopy.h +0 -91
  185. package/inc/util/stream/zerocopy_output.h +0 -57
  186. package/inc/util/stream/zlib.h +0 -173
  187. package/inc/util/string/ascii.h +0 -236
  188. package/inc/util/string/builder.h +0 -39
  189. package/inc/util/string/cast.h +0 -347
  190. package/inc/util/string/cstriter.h +0 -14
  191. package/inc/util/string/escape.h +0 -70
  192. package/inc/util/string/hex.h +0 -59
  193. package/inc/util/string/join.h +0 -194
  194. package/inc/util/string/printf.h +0 -13
  195. package/inc/util/string/reverse.h +0 -16
  196. package/inc/util/string/split.h +0 -1080
  197. package/inc/util/string/strip.h +0 -257
  198. package/inc/util/string/strspn.h +0 -65
  199. package/inc/util/string/subst.h +0 -56
  200. package/inc/util/string/type.h +0 -50
  201. package/inc/util/string/util.h +0 -195
  202. package/inc/util/string/vector.h +0 -132
  203. package/inc/util/system/align.h +0 -50
  204. package/inc/util/system/atexit.h +0 -22
  205. package/inc/util/system/atomic.h +0 -51
  206. package/inc/util/system/atomic_gcc.h +0 -90
  207. package/inc/util/system/atomic_ops.h +0 -189
  208. package/inc/util/system/atomic_win.h +0 -114
  209. package/inc/util/system/backtrace.h +0 -39
  210. package/inc/util/system/byteorder.h +0 -186
  211. package/inc/util/system/compat.h +0 -84
  212. package/inc/util/system/compiler.h +0 -620
  213. package/inc/util/system/condvar.h +0 -71
  214. package/inc/util/system/context.h +0 -181
  215. package/inc/util/system/context_aarch64.h +0 -8
  216. package/inc/util/system/context_i686.h +0 -9
  217. package/inc/util/system/context_x86.h +0 -12
  218. package/inc/util/system/context_x86_64.h +0 -7
  219. package/inc/util/system/cpu_id.h +0 -159
  220. package/inc/util/system/daemon.h +0 -28
  221. package/inc/util/system/datetime.h +0 -98
  222. package/inc/util/system/defaults.h +0 -149
  223. package/inc/util/system/demangle.h +0 -5
  224. package/inc/util/system/demangle_impl.h +0 -23
  225. package/inc/util/system/direct_io.h +0 -71
  226. package/inc/util/system/dynlib.h +0 -119
  227. package/inc/util/system/env.h +0 -32
  228. package/inc/util/system/error.h +0 -95
  229. package/inc/util/system/event.h +0 -122
  230. package/inc/util/system/execpath.h +0 -17
  231. package/inc/util/system/fasttime.h +0 -6
  232. package/inc/util/system/fhandle.h +0 -27
  233. package/inc/util/system/file.h +0 -210
  234. package/inc/util/system/file_lock.h +0 -34
  235. package/inc/util/system/filemap.h +0 -383
  236. package/inc/util/system/flock.h +0 -35
  237. package/inc/util/system/fs.h +0 -156
  238. package/inc/util/system/fs_win.h +0 -29
  239. package/inc/util/system/fstat.h +0 -46
  240. package/inc/util/system/getpid.h +0 -12
  241. package/inc/util/system/guard.h +0 -179
  242. package/inc/util/system/hi_lo.h +0 -139
  243. package/inc/util/system/hostname.h +0 -10
  244. package/inc/util/system/hp_timer.h +0 -36
  245. package/inc/util/system/info.h +0 -12
  246. package/inc/util/system/interrupt_signals.h +0 -22
  247. package/inc/util/system/madvise.h +0 -30
  248. package/inc/util/system/maxlen.h +0 -32
  249. package/inc/util/system/mem_info.h +0 -18
  250. package/inc/util/system/mincore.h +0 -38
  251. package/inc/util/system/mktemp.h +0 -11
  252. package/inc/util/system/mlock.h +0 -43
  253. package/inc/util/system/mutex.h +0 -67
  254. package/inc/util/system/nice.h +0 -3
  255. package/inc/util/system/pipe.h +0 -90
  256. package/inc/util/system/platform.h +0 -246
  257. package/inc/util/system/progname.h +0 -13
  258. package/inc/util/system/protect.h +0 -25
  259. package/inc/util/system/rusage.h +0 -26
  260. package/inc/util/system/rwlock.h +0 -78
  261. package/inc/util/system/sanitizers.h +0 -122
  262. package/inc/util/system/sem.h +0 -41
  263. package/inc/util/system/shellcommand.h +0 -472
  264. package/inc/util/system/shmat.h +0 -32
  265. package/inc/util/system/sigset.h +0 -78
  266. package/inc/util/system/spin_wait.h +0 -10
  267. package/inc/util/system/spinlock.h +0 -121
  268. package/inc/util/system/src_location.h +0 -25
  269. package/inc/util/system/src_root.h +0 -68
  270. package/inc/util/system/sys_alloc.h +0 -43
  271. package/inc/util/system/sysstat.h +0 -52
  272. package/inc/util/system/tempfile.h +0 -34
  273. package/inc/util/system/thread.h +0 -167
  274. package/inc/util/system/tls.h +0 -307
  275. package/inc/util/system/types.h +0 -119
  276. package/inc/util/system/unaligned_mem.h +0 -67
  277. package/inc/util/system/user.h +0 -5
  278. package/inc/util/system/utime.h +0 -6
  279. package/inc/util/system/valgrind.h +0 -48
  280. package/inc/util/system/winint.h +0 -43
  281. package/inc/util/system/yassert.h +0 -121
  282. package/inc/util/system/yield.h +0 -4
  283. package/inc/util/thread/factory.h +0 -65
  284. package/inc/util/thread/fwd.h +0 -30
  285. package/inc/util/thread/lfqueue.h +0 -406
  286. package/inc/util/thread/lfstack.h +0 -188
  287. package/inc/util/thread/pool.h +0 -388
  288. package/inc/util/thread/singleton.h +0 -42
  289. package/inc/util/ysafeptr.h +0 -427
  290. package/inc/util/ysaveload.h +0 -700
@@ -1,552 +0,0 @@
1
- #pragma once
2
-
3
- #include "fwd.h"
4
- #include "strbase.h"
5
- #include "utility.h"
6
- #include "typetraits.h"
7
-
8
- #include <string_view>
9
-
10
- template <typename TCharType, typename TTraits>
11
- class TBasicStringBuf:
12
- public std::basic_string_view<TCharType>,
13
- public TStringBase<TBasicStringBuf<TCharType, TTraits>, TCharType, TTraits>
14
- {
15
- private:
16
- using TdSelf = TBasicStringBuf;
17
- using TBase = TStringBase<TdSelf, TCharType, TTraits>;
18
- using TStringView = std::basic_string_view<TCharType>;
19
-
20
- public:
21
- using char_type = TCharType; // TODO: DROP
22
- using traits_type = TTraits;
23
-
24
- //Resolving some ambiguity between TStringBase and std::basic_string_view
25
- //for typenames
26
- using typename TStringView::size_type;
27
- using typename TStringView::value_type;
28
- using typename TStringView::iterator;
29
- using typename TStringView::const_iterator;
30
- using typename TStringView::reverse_iterator;
31
- using typename TStringView::const_reverse_iterator;
32
- using typename TStringView::reference;
33
- using typename TStringView::const_reference;
34
-
35
- //for constants
36
- using TStringView::npos;
37
-
38
- //for methods and operators
39
- using TStringView::begin;
40
- using TStringView::end;
41
- using TStringView::cbegin;
42
- using TStringView::cend;
43
- using TStringView::rbegin;
44
- using TStringView::rend;
45
- using TStringView::crbegin;
46
- using TStringView::crend;
47
-
48
- using TStringView::size;
49
- using TStringView::empty;
50
- using TStringView::data;
51
-
52
- using TStringView::operator[];
53
-
54
- /*
55
- * WARN:
56
- * TBase::at silently returns 0 in case of range error,
57
- * while std::string_view throws std::out_of_range.
58
- */
59
- using TBase::at;
60
- using TStringView::front;
61
- using TStringView::back;
62
-
63
- using TStringView::find;
64
- /*
65
- * WARN:
66
- * TBase::*find* methods take into account TCharTraits,
67
- * while TStringView::*find* would use default std::char_traits.
68
- */
69
- using TBase::rfind;
70
- using TBase::find_first_of;
71
- using TBase::find_first_not_of;
72
- using TBase::find_last_of;
73
- using TBase::find_last_not_of;
74
-
75
- using TStringView::copy;
76
- /*
77
- * WARN:
78
- * TBase::compare takes into account TCharTraits,
79
- * thus making it possible to implement case-insensitive string buffers,
80
- * if it is using TStringBase::compare
81
- */
82
- using TBase::compare;
83
-
84
- /*
85
- * WARN:
86
- * TBase::substr properly checks boundary cases and clamps them with maximum valid values,
87
- * while TStringView::substr throws std::out_of_range error.
88
- */
89
- using TBase::substr;
90
-
91
- /*
92
- * WARN:
93
- * Constructing std::string_view(nullptr, non_zero_size) ctor
94
- * results in undefined behavior according to the standard.
95
- * In libc++ this UB results in runtime assertion, though it is better
96
- * to generate compilation error instead.
97
- */
98
- constexpr inline TBasicStringBuf(std::nullptr_t begin, size_t size) = delete;
99
-
100
- constexpr inline TBasicStringBuf(const TCharType* data, size_t size) noexcept
101
- : TStringView(data, size)
102
- {
103
- }
104
-
105
- _LIBCPP_CONSTEXPR_AFTER_CXX14
106
- inline TBasicStringBuf(const TCharType* data) noexcept
107
- /*
108
- * WARN: TBase::StrLen properly handles nullptr,
109
- * while std::string_view (using std::char_traits) will abort in such case
110
- */
111
- : TStringView(data, TBase::StrLen(data))
112
- {
113
- }
114
-
115
- constexpr inline TBasicStringBuf(const TCharType* beg, const TCharType* end) noexcept
116
- : TStringView(beg, end - beg)
117
- {
118
- }
119
-
120
- template <typename D, typename T>
121
- inline TBasicStringBuf(const TStringBase<D, TCharType, T>& str) noexcept
122
- : TStringView(str.data(), str.size())
123
- {
124
- }
125
-
126
- template <typename T, typename A>
127
- inline TBasicStringBuf(const std::basic_string<TCharType, T, A>& str) noexcept
128
- : TStringView(str)
129
- {
130
- }
131
-
132
- template <typename TCharTraits>
133
- constexpr TBasicStringBuf(std::basic_string_view<TCharType, TCharTraits> view) noexcept
134
- : TStringView(view)
135
- {
136
- }
137
-
138
- constexpr inline TBasicStringBuf() noexcept
139
- {
140
- /*
141
- * WARN:
142
- * This ctor can not be defaulted due to the following feature of default initialization:
143
- * If T is a const-qualified type, it must be a class type with a user-provided default constructor.
144
- * (see https://en.cppreference.com/w/cpp/language/default_initialization).
145
- *
146
- * This means, that a class with default ctor can not be a constant member of another class with default ctor.
147
- */
148
- }
149
-
150
- inline TBasicStringBuf(const TBasicStringBuf& src, size_t pos, size_t n) noexcept
151
- : TBasicStringBuf(src)
152
- {
153
- Skip(pos).Trunc(n);
154
- }
155
-
156
- inline TBasicStringBuf(const TBasicStringBuf& src, size_t pos) noexcept
157
- : TBasicStringBuf(src, pos, TBase::npos)
158
- {
159
- }
160
-
161
- Y_PURE_FUNCTION
162
- inline TBasicStringBuf SubString(size_t pos, size_t n) const noexcept {
163
- pos = Min(pos, size());
164
- n = Min(n, size() - pos);
165
- return TBasicStringBuf(data() + pos, n);
166
- }
167
-
168
- public:
169
- void Clear() {
170
- *this = TdSelf();
171
- }
172
-
173
- constexpr bool IsInited() const noexcept {
174
- return data() != nullptr;
175
- }
176
-
177
- public:
178
- /**
179
- * Tries to split string in two parts using given delimiter character.
180
- * Searches for the delimiter, scanning string from the beginning.
181
- * The delimiter is excluded from the result. Both out parameters are
182
- * left unmodified if there was no delimiter character in string.
183
- *
184
- * @param[in] delim Delimiter character.
185
- * @param[out] l The first part of split result.
186
- * @param[out] r The second part of split result.
187
- * @returns Whether the split was actually performed.
188
- */
189
- inline bool TrySplit(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
190
- return TrySplitOn(TBase::find(delim), l, r);
191
- }
192
-
193
- /**
194
- * Tries to split string in two parts using given delimiter character.
195
- * Searches for the delimiter, scanning string from the end.
196
- * The delimiter is excluded from the result. Both out parameters are
197
- * left unmodified if there was no delimiter character in string.
198
- *
199
- * @param[in] delim Delimiter character.
200
- * @param[out] l The first part of split result.
201
- * @param[out] r The second part of split result.
202
- * @returns Whether the split was actually performed.
203
- */
204
- inline bool TryRSplit(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
205
- return TrySplitOn(TBase::rfind(delim), l, r);
206
- }
207
-
208
- /**
209
- * Tries to split string in two parts using given delimiter sequence.
210
- * Searches for the delimiter, scanning string from the beginning.
211
- * The delimiter sequence is excluded from the result. Both out parameters
212
- * are left unmodified if there was no delimiter sequence in string.
213
- *
214
- * @param[in] delim Delimiter sequence.
215
- * @param[out] l The first part of split result.
216
- * @param[out] r The second part of split result.
217
- * @returns Whether the split was actually performed.
218
- */
219
- inline bool TrySplit(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
220
- return TrySplitOn(TBase::find(delim), l, r, delim.size());
221
- }
222
-
223
- /**
224
- * Tries to split string in two parts using given delimiter sequence.
225
- * Searches for the delimiter, scanning string from the end.
226
- * The delimiter sequence is excluded from the result. Both out parameters
227
- * are left unmodified if there was no delimiter sequence in string.
228
- *
229
- * @param[in] delim Delimiter sequence.
230
- * @param[out] l The first part of split result.
231
- * @param[out] r The second part of split result.
232
- * @returns Whether the split was actually performed.
233
- */
234
- inline bool TryRSplit(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
235
- return TrySplitOn(TBase::rfind(delim), l, r, delim.size());
236
- }
237
-
238
- inline void Split(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
239
- SplitTemplate(delim, l, r);
240
- }
241
-
242
- inline void RSplit(TCharType delim, TdSelf& l, TdSelf& r) const noexcept {
243
- RSplitTemplate(delim, l, r);
244
- }
245
-
246
- inline void Split(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
247
- SplitTemplate(delim, l, r);
248
- }
249
-
250
- inline void RSplit(TdSelf delim, TdSelf& l, TdSelf& r) const noexcept {
251
- RSplitTemplate(delim, l, r);
252
- }
253
-
254
- private:
255
- // splits on a delimiter at a given position; delimiter is excluded
256
- void DoSplitOn(size_t pos, TdSelf& l, TdSelf& r, size_t len) const noexcept {
257
- Y_ASSERT(pos != TBase::npos);
258
-
259
- // make a copy in case one of l/r is really *this
260
- const TdSelf tok = SubStr(pos + len);
261
- l = Head(pos);
262
- r = tok;
263
- }
264
-
265
- public:
266
- // In all methods below with @pos parameter, @pos is supposed to be
267
- // a result of string find()/rfind()/find_first() or other similar functions,
268
- // returning either position within string length [0..size()) or npos.
269
- // For all other @pos values (out of string index range) the behaviour isn't well defined
270
- // For example, for TStringBuf s("abc"):
271
- // s.TrySplitOn(s.find('z'), ...) is false, but s.TrySplitOn(100500, ...) is true.
272
-
273
- bool TrySplitOn(size_t pos, TdSelf& l, TdSelf& r, size_t len = 1) const noexcept {
274
- if (TBase::npos == pos)
275
- return false;
276
-
277
- DoSplitOn(pos, l, r, len);
278
- return true;
279
- }
280
-
281
- void SplitOn(size_t pos, TdSelf& l, TdSelf& r, size_t len = 1) const noexcept {
282
- if (!TrySplitOn(pos, l, r, len)) {
283
- l = *this;
284
- r = TdSelf();
285
- }
286
- }
287
-
288
- bool TrySplitAt(size_t pos, TdSelf& l, TdSelf& r) const noexcept {
289
- return TrySplitOn(pos, l, r, 0);
290
- }
291
-
292
- void SplitAt(size_t pos, TdSelf& l, TdSelf& r) const noexcept {
293
- SplitOn(pos, l, r, 0);
294
- }
295
-
296
- /*
297
- // Not implemented intentionally, use TrySplitOn() instead
298
- void RSplitOn(size_t pos, TdSelf& l, TdSelf& r) const noexcept;
299
- void RSplitAt(size_t pos, TdSelf& l, TdSelf& r) const noexcept;
300
- */
301
-
302
- public:
303
- Y_PURE_FUNCTION
304
- inline TdSelf After(TCharType c) const noexcept {
305
- TdSelf l, r;
306
- return TrySplit(c, l, r) ? r : *this;
307
- }
308
-
309
- Y_PURE_FUNCTION
310
- inline TdSelf Before(TCharType c) const noexcept {
311
- TdSelf l, r;
312
- return TrySplit(c, l, r) ? l : *this;
313
- }
314
-
315
- Y_PURE_FUNCTION
316
- inline TdSelf RAfter(TCharType c) const noexcept {
317
- TdSelf l, r;
318
- return TryRSplit(c, l, r) ? r : *this;
319
- }
320
-
321
- Y_PURE_FUNCTION
322
- inline TdSelf RBefore(TCharType c) const noexcept {
323
- TdSelf l, r;
324
- return TryRSplit(c, l, r) ? l : *this;
325
- }
326
-
327
- public:
328
- inline bool AfterPrefix(const TdSelf& prefix, TdSelf& result) const noexcept {
329
- if (this->StartsWith(prefix)) {
330
- result = Tail(prefix.size());
331
- return true;
332
- }
333
- return false;
334
- }
335
-
336
- inline bool BeforeSuffix(const TdSelf& suffix, TdSelf& result) const noexcept {
337
- if (this->EndsWith(suffix)) {
338
- result = Head(size() - suffix.size());
339
- return true;
340
- }
341
- return false;
342
- }
343
-
344
- // returns true if string started with `prefix`, false otherwise
345
- inline bool SkipPrefix(const TdSelf& prefix) noexcept {
346
- return AfterPrefix(prefix, *this);
347
- }
348
-
349
- // returns true if string ended with `suffix`, false otherwise
350
- inline bool ChopSuffix(const TdSelf& suffix) noexcept {
351
- return BeforeSuffix(suffix, *this);
352
- }
353
-
354
- public:
355
- // returns tail, including pos
356
- TdSelf SplitOffAt(size_t pos) {
357
- const TdSelf tok = SubStr(pos);
358
- Trunc(pos);
359
- return tok;
360
- }
361
-
362
- // returns head, tail includes pos
363
- TdSelf NextTokAt(size_t pos) {
364
- const TdSelf tok = Head(pos);
365
- Skip(pos);
366
- return tok;
367
- }
368
-
369
- TdSelf SplitOffOn(size_t pos) {
370
- TdSelf tok;
371
- SplitOn(pos, *this, tok);
372
- return tok;
373
- }
374
-
375
- TdSelf NextTokOn(size_t pos) {
376
- TdSelf tok;
377
- SplitOn(pos, tok, *this);
378
- return tok;
379
- }
380
- /*
381
- // See comment on RSplitOn() above
382
- TdSelf RSplitOffOn(size_t pos);
383
- TdSelf RNextTokOn(size_t pos);
384
- */
385
-
386
- public:
387
- TdSelf SplitOff(TCharType delim) {
388
- TdSelf tok;
389
- Split(delim, *this, tok);
390
- return tok;
391
- }
392
-
393
- TdSelf RSplitOff(TCharType delim) {
394
- TdSelf tok;
395
- RSplit(delim, tok, *this);
396
- return tok;
397
- }
398
-
399
- bool NextTok(TCharType delim, TdSelf& tok) {
400
- return NextTokTemplate(delim, tok);
401
- }
402
-
403
- bool NextTok(TdSelf delim, TdSelf& tok) {
404
- return NextTokTemplate(delim, tok);
405
- }
406
-
407
- bool RNextTok(TCharType delim, TdSelf& tok) {
408
- return RNextTokTemplate(delim, tok);
409
- }
410
-
411
- bool RNextTok(TdSelf delim, TdSelf& tok) {
412
- return RNextTokTemplate(delim, tok);
413
- }
414
-
415
- bool ReadLine(TdSelf& tok) {
416
- if (NextTok('\n', tok)) {
417
- while (!tok.empty() && tok.back() == '\r') {
418
- tok.remove_suffix(1);
419
- }
420
-
421
- return true;
422
- }
423
-
424
- return false;
425
- }
426
-
427
- TdSelf NextTok(TCharType delim) {
428
- return NextTokTemplate(delim);
429
- }
430
-
431
- TdSelf RNextTok(TCharType delim) {
432
- return RNextTokTemplate(delim);
433
- }
434
-
435
- TdSelf NextTok(TdSelf delim) {
436
- return NextTokTemplate(delim);
437
- }
438
-
439
- TdSelf RNextTok(TdSelf delim) {
440
- return RNextTokTemplate(delim);
441
- }
442
-
443
- public: // string subsequences
444
- /// Cut last @c shift characters (or less if length is less than @c shift)
445
- inline TdSelf& Chop(size_t shift) noexcept {
446
- this->remove_suffix(std::min(shift, size()));
447
- return *this;
448
- }
449
-
450
- /// Cut first @c shift characters (or less if length is less than @c shift)
451
- inline TdSelf& Skip(size_t shift) noexcept {
452
- this->remove_prefix(std::min(shift, size()));
453
- return *this;
454
- }
455
-
456
- /// Sets the start pointer to a position relative to the end
457
- inline TdSelf& RSeek(size_t tailSize) noexcept {
458
- if (size() > tailSize) {
459
- //WARN: removing TStringView:: will lead to an infinite recursion
460
- *this = TStringView::substr(size() - tailSize, tailSize);
461
- }
462
-
463
- return *this;
464
- }
465
-
466
- inline TdSelf& Trunc(size_t targetSize) noexcept {
467
- //WARN: removing TStringView:: will lead to an infinite recursion
468
- *this = TStringView::substr(0, targetSize);
469
- return *this;
470
- }
471
-
472
- Y_PURE_FUNCTION
473
- inline TdSelf SubStr(size_t beg) const noexcept {
474
- return TdSelf(*this).Skip(beg);
475
- }
476
-
477
- Y_PURE_FUNCTION
478
- inline TdSelf SubStr(size_t beg, size_t len) const noexcept {
479
- return SubStr(beg).Trunc(len);
480
- }
481
-
482
- Y_PURE_FUNCTION
483
- inline TdSelf Head(size_t pos) const noexcept {
484
- return TdSelf(*this).Trunc(pos);
485
- }
486
-
487
- Y_PURE_FUNCTION
488
- inline TdSelf Tail(size_t pos) const noexcept {
489
- return SubStr(pos);
490
- }
491
-
492
- Y_PURE_FUNCTION
493
- inline TdSelf Last(size_t len) const noexcept {
494
- return TdSelf(*this).RSeek(len);
495
- }
496
-
497
- private:
498
- template <typename TDelimiterType>
499
- TdSelf NextTokTemplate(TDelimiterType delim) {
500
- TdSelf tok;
501
- Split(delim, tok, *this);
502
- return tok;
503
- }
504
-
505
- template <typename TDelimiterType>
506
- TdSelf RNextTokTemplate(TDelimiterType delim) {
507
- TdSelf tok;
508
- RSplit(delim, *this, tok);
509
- return tok;
510
- }
511
-
512
- template <typename TDelimiterType>
513
- bool NextTokTemplate(TDelimiterType delim, TdSelf& tok) {
514
- if (!empty()) {
515
- tok = NextTokTemplate(delim);
516
- return true;
517
- }
518
- return false;
519
- }
520
-
521
- template <typename TDelimiterType>
522
- bool RNextTokTemplate(TDelimiterType delim, TdSelf& tok) {
523
- if (!empty()) {
524
- tok = RNextTokTemplate(delim);
525
- return true;
526
- }
527
- return false;
528
- }
529
-
530
- template <typename TDelimiterType>
531
- inline void SplitTemplate(TDelimiterType delim, TdSelf& l, TdSelf& r) const noexcept {
532
- if (!TrySplit(delim, l, r)) {
533
- l = *this;
534
- r = TdSelf();
535
- }
536
- }
537
-
538
- template <typename TDelimiterType>
539
- inline void RSplitTemplate(TDelimiterType delim, TdSelf& l, TdSelf& r) const noexcept {
540
- if (!TryRSplit(delim, l, r)) {
541
- r = *this;
542
- l = TdSelf();
543
- }
544
- }
545
- };
546
-
547
- std::ostream& operator<< (std::ostream& os, TStringBuf buf);
548
-
549
- template <typename TCharType, size_t size>
550
- constexpr inline TBasicStringBuf<TCharType> AsStringBuf(const TCharType (&str)[size]) noexcept {
551
- return TBasicStringBuf<TCharType>(str, size - 1);
552
- }
@@ -1,17 +0,0 @@
1
- #pragma once
2
-
3
- /*
4
- * strfcpy is a faster version of strlcpy().
5
- * It returns void and thus does not waste time computing
6
- * (most likely, unneeded) strlen(str)
7
- *
8
- * Comparison with other copying functions:
9
- * strcpy() - buffer overflow ready
10
- * strncpy() - wastes time filling exactly n bytes with 0
11
- * strlcpy() - wastes time searching for the length of src
12
- * memcpy() - wastes time copying exactly n bytes even if the string is shorter
13
- */
14
-
15
- #include <stddef.h>
16
-
17
- void strfcpy(char* dst, const char* src, size_t n);