forked from scylladb/scylladb
-
Notifications
You must be signed in to change notification settings - Fork 0
/
duration.cc
453 lines (358 loc) · 14.9 KB
/
duration.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
/*
* Copyright (C) 2017-present ScyllaDB
*/
/*
* SPDX-License-Identifier: AGPL-3.0-or-later
*/
#include "duration.hh"
#include <boost/lexical_cast.hpp>
#include <seastar/core/format.hh>
#include <cctype>
#include <optional>
#include <limits>
#include <boost/regex.hpp>
#include <sstream>
#include <string>
#include <unordered_map>
namespace {
//
// Helper for retrieving the counter based on knowing its type.
//
template<class Counter>
constexpr typename Counter::value_type& counter_ref(cql_duration &) noexcept;
template<>
constexpr months_counter::value_type& counter_ref<months_counter>(cql_duration &d) noexcept {
return d.months;
}
template<>
constexpr days_counter::value_type& counter_ref<days_counter>(cql_duration &d) noexcept {
return d.days;
}
template<>
constexpr nanoseconds_counter::value_type& counter_ref<nanoseconds_counter>(cql_duration &d) noexcept {
return d.nanoseconds;
}
// Abstract description of one unit that a duration component can be expressed in (for example, years).
class duration_unit {
public:
    using common_counter_type = cql_duration::common_counter_type;
    using index_type = uint8_t;

    virtual ~duration_unit() = default;

    // Rank of the unit: a larger index means a greater unit ("months" rank above "days").
    virtual index_type index() const noexcept = 0;

    // Abbreviated symbol of the unit.
    virtual const char* short_name() const noexcept = 0;

    // Spelled-out plural name of the unit, as used in error messages.
    virtual const char* long_name() const noexcept = 0;

    // Adds the given count of this unit to whichever counter of the duration stores it.
    virtual void increment_count(cql_duration&, common_counter_type) const noexcept = 0;

    // How many more of this unit still fit into the counter of the duration that stores it.
    virtual common_counter_type available_count(const cql_duration&) const noexcept = 0;
};
// Concrete `duration_unit` for a unit with a fixed conversion factor.
//
// Template parameters:
//   `_index`  - the index reported by `index()`.
//   `Counter` - the counter type of `cql_duration` in which this unit is stored.
//   `_factor` - how many counts of `Counter` make up one count of this unit.
template <uint8_t _index, class Counter, cql_duration::common_counter_type _factor>
class duration_unit_impl : public duration_unit {
public:
    static constexpr auto factor = _factor;

    virtual ~duration_unit_impl() = default;

    index_type index() const noexcept override {
        return _index;
    }

    // Converts `c` units into counter ticks and adds them to the backing counter. No overflow check is done here.
    void increment_count(cql_duration& d, common_counter_type c) const noexcept override {
        auto& counter = counter_ref<Counter>(d);
        counter += (c * factor);
    }

    // Distance from the counter's current value to its maximum, expressed in whole units.
    common_counter_type available_count(const cql_duration& d) const noexcept override {
        using value_type = typename Counter::value_type;
        // `counter_ref` only takes a mutable reference; the counter is merely read here.
        const value_type used = counter_ref<Counter>(const_cast<cql_duration&>(d));
        const value_type limit = std::numeric_limits<value_type>::max();
        return {(limit - used) / factor};
    }
};
struct nanosecond_unit final : public duration_unit_impl<0, nanoseconds_counter , 1> {
const char* short_name() const noexcept override { return "ns"; }
const char* long_name() const noexcept override { return "nanoseconds"; }
} const nanosecond{};
struct microsecond_unit final : public duration_unit_impl<1, nanoseconds_counter, 1000> {
const char* short_name() const noexcept override { return "us"; }
const char* long_name() const noexcept override { return "microseconds"; }
} const microsecond{};
struct millisecond_unit final : public duration_unit_impl<2, nanoseconds_counter, microsecond_unit::factor * 1000> {
const char* short_name() const noexcept override { return "ms"; }
const char* long_name() const noexcept override { return "milliseconds"; }
} const millisecond{};
struct second_unit final : public duration_unit_impl<3, nanoseconds_counter, millisecond_unit::factor * 1000> {
const char* short_name() const noexcept override { return "s"; }
const char* long_name() const noexcept override { return "seconds"; }
} const second{};
struct minute_unit final : public duration_unit_impl<4, nanoseconds_counter, second_unit::factor * 60> {
const char* short_name() const noexcept override { return "m"; }
const char* long_name() const noexcept override { return "minutes"; }
} const minute{};
struct hour_unit final : public duration_unit_impl<5, nanoseconds_counter, minute_unit::factor * 60> {
const char* short_name() const noexcept override { return "h"; }
const char* long_name() const noexcept override { return "hours"; }
} const hour{};
struct day_unit final : public duration_unit_impl<6, days_counter, 1> {
const char* short_name() const noexcept override { return "d"; }
const char* long_name() const noexcept override { return "days"; }
} const day{};
struct week_unit final : public duration_unit_impl<7, days_counter, 7> {
const char* short_name() const noexcept override { return "w"; }
const char* long_name() const noexcept override { return "weeks"; }
} const week{};
struct month_unit final : public duration_unit_impl<8, months_counter, 1> {
const char* short_name() const noexcept override { return "mo"; }
const char* long_name() const noexcept override { return "months"; }
} const month{};
struct year_unit final : public duration_unit_impl<9, months_counter, 12> {
const char* short_name() const noexcept override { return "y"; }
const char* long_name() const noexcept override { return "years"; }
} const year{};
const auto unit_table = std::unordered_map<std::string_view, std::reference_wrapper<const duration_unit>>{
{year.short_name(), year},
{month.short_name(), month},
{week.short_name(), week},
{day.short_name(), day},
{hour.short_name(), hour},
{minute.short_name(), minute},
{second.short_name(), second},
{millisecond.short_name(), millisecond},
{microsecond.short_name(), microsecond}, {"µs", microsecond},
{nanosecond.short_name(), nanosecond}
};
//
// Converts the text of sub-expression `group_index` of the match `m` into a duration counter value.
//
// Throws `std::out_of_range` when `boost::lexical_cast` cannot convert the text to
// `cql_duration::common_counter_type`.
//
template <class Match, class Index = typename Match::size_type>
cql_duration::common_counter_type parse_count(const Match& m, Index group_index) {
    using counter_type = cql_duration::common_counter_type;

    const auto digits = m[group_index].str();
    try {
        return boost::lexical_cast<counter_type>(digits);
    } catch (const boost::bad_lexical_cast&) {
        throw std::out_of_range("duration counter");
    }
}
//
// Build up a duration unit-by-unit.
//
// We support overflow detection on construction for convenience and compatibility with Cassandra.
//
// We maintain some additional state over a `cql_duration` in order to track the order in which components are added when
// parsing the standard format.
//
class duration_builder final {
public:
duration_builder& add(cql_duration::common_counter_type count, const duration_unit& unit) {
validate_addition(count, unit);
validate_and_update_order(unit);
unit.increment_count(_duration, count);
return *this;
}
template <class Match, class Index = typename Match::size_type>
duration_builder& add_parsed_count(const Match& m, Index group_index, const duration_unit& unit) {
cql_duration::common_counter_type count;
try {
count = parse_count(m, group_index);
} catch (const std::out_of_range&) {
throw cql_duration_error(seastar::format("Invalid duration. The count for the {} is out of range", unit.long_name()));
}
return add(count, unit);
}
cql_duration build() const noexcept {
return _duration;
}
private:
const duration_unit* _current_unit{nullptr};
cql_duration _duration{};
//
// Throws `cql_duration_error` if the addition of a quantity of the designated unit would overflow one of the
// counters.
//
void validate_addition(typename cql_duration::common_counter_type count, const duration_unit& unit) const {
const auto available = unit.available_count(_duration);
if (count > available) {
throw cql_duration_error(
seastar::format("Invalid duration. The number of {} must be less than or equal to {}",
unit.long_name(),
available));
}
}
//
// Validate that an addition of a quantity of the designated unit is not out of order. We require that units are
// added in decreasing size.
//
// This function also updates the last-observed unit for the next invocation.
//
// Throws `cql_duration_error` for order violations.
//
void validate_and_update_order(const duration_unit& unit) {
const auto index = unit.index();
if (_current_unit != nullptr) {
if (index == _current_unit->index()) {
throw cql_duration_error(seastar::format("Invalid duration. The {} are specified multiple times", unit.long_name()));
} else if (index > _current_unit->index()) {
throw cql_duration_error(
seastar::format("Invalid duration. The {} should be after {}",
_current_unit->long_name(),
unit.long_name()));
}
}
_current_unit = &unit;
}
};
//
// These functions assume no sign information ('-'). That is left to the `cql_duration` constructor.
//
//
// Parses the standard format: a sequence of `<count><unit>` components such as "1y2mo3d".
//
// Returns an empty optional when some part of the input is not a valid component.
// Throws `cql_duration_error` when a count is out of range, overflows a counter, or when units are repeated or
// out of order.
//
std::optional<cql_duration> parse_duration_standard_format(std::string_view s) {
    //
    // One component (a count followed by a unit) is consumed per iteration. This allows precise error messages
    // for repeated or out-of-order units instead of a generic "parse error".
    //
    // The other formats are more strict and complain less helpfully.
    //
    static const auto pattern =
            boost::regex("(\\d+)(y|Y|mo|MO|mO|Mo|w|W|d|D|h|H|s|S|ms|MS|mS|Ms|us|US|uS|Us|µs|µS|ns|NS|nS|Ns|m|M)");

    const std::string_view mu = reinterpret_cast<const char*>(u8"µ");

    duration_builder b;
    boost::cmatch match;
    auto cursor = s.cbegin();

    // With `match_continuous`, a match must begin exactly at `cursor`, so no input can be skipped over.
    while (boost::regex_search(cursor, s.end(), match, pattern, boost::regex_constants::match_continuous)) {
        cursor += match.length();

        auto symbol = match[2].str();

        // The mu spellings are recognized by what precedes their final character, since mu has no ASCII lower-case.
        const auto stem = std::string_view(symbol).substr(0, symbol.size() - 1);
        if (stem == mu) {
            b.add_parsed_count(match, 1, microsecond);
            continue;
        }

        // Every other symbol is looked up by its lower-case spelling.
        for (char& ch : symbol) {
            ch = std::tolower(ch);
        }
        b.add_parsed_count(match, 1, unit_table.at(symbol));
    }

    // Anything left over could not be parsed as a component.
    if (cursor != s.cend()) {
        return {};
    }
    return b.build();
}
//
// Parses the ISO 8601 designator format, `P[n]Y[n]M[n]D[T[n]H[n]M[n]S]`, in which every component is optional.
//
// Returns an empty optional when `s` does not match the format as a whole.
// Throws `cql_duration_error` when a count is out of range or overflows a counter.
//
std::optional<cql_duration> parse_duration_iso8601_format(std::string_view s) {
    static const auto pattern = boost::regex("P((\\d+)Y)?((\\d+)M)?((\\d+)D)?(T((\\d+)H)?((\\d+)M)?((\\d+)S)?)?");

    boost::cmatch match;
    // Match over the explicit [begin, end) range: a `string_view` is not necessarily NUL-terminated, so handing
    // `s.data()` to the C-string overload could read past the end of the view (or stop early at an embedded NUL).
    if (!boost::regex_match(s.data(), s.data() + s.size(), match, pattern)) {
        return {};
    }

    duration_builder b;

    // Odd groups are the whole `<count><designator>` component; the following even group is the count alone.
    if (match[1].matched) {
        b.add_parsed_count(match, 2, year);
    }

    if (match[3].matched) {
        b.add_parsed_count(match, 4, month);
    }

    if (match[5].matched) {
        b.add_parsed_count(match, 6, day);
    }

    // Optional, more granular, information (the part introduced by 'T').
    if (match[7].matched) {
        if (match[8].matched) {
            b.add_parsed_count(match, 9, hour);
        }

        if (match[10].matched) {
            b.add_parsed_count(match, 11, minute);
        }

        if (match[12].matched) {
            b.add_parsed_count(match, 13, second);
        }
    }

    return b.build();
}
//
// Parses the ISO 8601 alternative format, `PYYYY-MM-DDThh:mm:ss`, in which every field is mandatory and has a
// fixed number of digits.
//
// Returns an empty optional when `s` does not match the format as a whole.
// Throws `cql_duration_error` when a count is out of range or overflows a counter.
//
std::optional<cql_duration> parse_duration_iso8601_alternative_format(std::string_view s) {
    static const auto pattern = boost::regex("P(\\d{4})-(\\d{2})-(\\d{2})T(\\d{2}):(\\d{2}):(\\d{2})");

    boost::cmatch match;
    // Match over the explicit [begin, end) range: a `string_view` is not necessarily NUL-terminated, so handing
    // `s.data()` to the C-string overload could read past the end of the view (or stop early at an embedded NUL).
    if (!boost::regex_match(s.data(), s.data() + s.size(), match, pattern)) {
        return {};
    }

    return duration_builder()
            .add_parsed_count(match, 1, year)
            .add_parsed_count(match, 2, month)
            .add_parsed_count(match, 3, day)
            .add_parsed_count(match, 4, hour)
            .add_parsed_count(match, 5, minute)
            .add_parsed_count(match, 6, second)
            .build();
}
//
// Parses the ISO 8601 week format, `P[n]W`.
//
// Returns an empty optional when `s` does not match the format as a whole.
// Throws `cql_duration_error` when the count is out of range or overflows the counter.
//
std::optional<cql_duration> parse_duration_iso8601_week_format(std::string_view s) {
    static const auto pattern = boost::regex("P(\\d+)W");

    boost::cmatch match;
    // Match over the explicit [begin, end) range: a `string_view` is not necessarily NUL-terminated, so handing
    // `s.data()` to the C-string overload could read past the end of the view (or stop early at an embedded NUL).
    if (!boost::regex_match(s.data(), s.data() + s.size(), match, pattern)) {
        return {};
    }

    return duration_builder()
            .add_parsed_count(match, 1, week)
            .build();
}
//
// Parses a duration string that carries no sign, choosing the parser from the shape of the input:
//
//   - anything not starting with 'P' is treated as the standard format;
//   - "P...W" is treated as the ISO 8601 week format;
//   - "P..." containing a '-' is treated as the ISO 8601 alternative format;
//   - any other "P..." is treated as the ISO 8601 designator format.
//
// Returns an empty optional for empty input or when the selected parser rejects the input.
//
std::optional<cql_duration> parse_duration(std::string_view s) {
    if (s.length() == 0u) {
        return {};
    }

    if (s.front() != 'P') {
        return parse_duration_standard_format(s);
    }

    if (s.back() == 'W') {
        return parse_duration_iso8601_week_format(s);
    }

    const bool has_dash = (s.find('-') != s.npos);
    return has_dash ? parse_duration_iso8601_alternative_format(s)
                    : parse_duration_iso8601_format(s);
}
}
//
// Constructs a duration from its textual form, optionally prefixed with '-' for a negative duration.
//
// Throws `cql_duration_error` if the text (without the sign) cannot be parsed as a duration.
//
cql_duration::cql_duration(std::string_view s) {
    const bool is_negative = !s.empty() && (s.front() == '-');

    // Without any sign indicator ('-').
    //
    // The remainder is taken as a sub-view so that its length is preserved. Passing a bare character pointer
    // instead would make the callee recompute the length by scanning for a NUL terminator, which a `string_view`
    // is not guaranteed to have.
    const std::string_view unsigned_part = is_negative ? s.substr(1) : s;

    const auto d = parse_duration(unsigned_part);
    if (!d) {
        throw cql_duration_error(seastar::format("Unable to convert '{}' to a duration", s));
    }

    *this = *d;

    // The parsers only produce non-negative counters; the sign applies to all of them.
    if (is_negative) {
        months = -months;
        days = -days;
        nanoseconds = -nanoseconds;
    }
}
//
// Writes the duration in the standard format, for example "1y2mo3d4h".
//
// A leading '-' is written if any counter is negative. Months are split into years and months, days are written
// as days only, and nanoseconds are split from hours down to nanoseconds. Components that are zero are omitted.
//
std::ostream& operator<<(std::ostream& os, const cql_duration& d) {
    const bool negative = (d.months < 0) || (d.days < 0) || (d.nanoseconds < 0);
    if (negative) {
        os << '-';
    }

    // Writes the whole number of `unit`s contained in `count` (followed by the unit's symbol) when there is at
    // least one, and returns what is left of `count` afterwards. Otherwise writes nothing and returns `count`.
    const auto append = [&os](cql_duration::common_counter_type count, auto&& unit) {
        const auto divider = unit.factor;
        if ((count != 0) && (count >= divider)) {
            os << (count / divider) << unit.short_name();
            return count % divider;
        }
        return count;
    };

    // Months counter: years first, then the remaining months.
    const auto months_left = append(std::abs(d.months), year);
    append(months_left, month);

    // Days counter.
    append(std::abs(d.days), day);

    // Nanoseconds counter: from the largest sub-day unit down to the smallest.
    auto nanos_left = append(std::abs(d.nanoseconds), hour);
    nanos_left = append(nanos_left, minute);
    nanos_left = append(nanos_left, second);
    nanos_left = append(nanos_left, millisecond);
    nanos_left = append(nanos_left, microsecond);
    append(nanos_left, nanosecond);

    return os;
}
// Returns the text that streaming `d` with `operator<<` produces.
seastar::sstring to_string(const cql_duration& d) {
    std::ostringstream out;
    out << d;
    return out.str();
}