Bitcoin Core  29.1.0
P2P Digital Currency
strencodings.h
Go to the documentation of this file.
1 // Copyright (c) 2009-2010 Satoshi Nakamoto
2 // Copyright (c) 2009-2022 The Bitcoin Core developers
3 // Distributed under the MIT software license, see the accompanying
4 // file COPYING or http://www.opensource.org/licenses/mit-license.php.
5 
9 #ifndef BITCOIN_UTIL_STRENCODINGS_H
10 #define BITCOIN_UTIL_STRENCODINGS_H
11 
12 #include <crypto/hex_base.h> // IWYU pragma: export
13 #include <span.h>
14 #include <util/string.h>
15 
16 #include <array>
17 #include <bit>
18 #include <charconv>
19 #include <cstddef>
20 #include <cstdint>
21 #include <limits>
22 #include <optional>
23 #include <string> // IWYU pragma: export
24 #include <string_view> // IWYU pragma: export
25 #include <system_error>
26 #include <type_traits>
27 #include <vector>
28 
31 {
36 };
37 
43 enum class ByteUnit : uint64_t {
44  NOOP = 1ULL,
45  k = 1000ULL,
46  K = 1024ULL,
47  m = 1'000'000ULL,
48  M = 1ULL << 20,
49  g = 1'000'000'000ULL,
50  G = 1ULL << 30,
51  t = 1'000'000'000'000ULL,
52  T = 1ULL << 40,
53 };
54 
62 std::string SanitizeString(std::string_view str, int rule = SAFE_CHARS_DEFAULT);
64 template <typename Byte = std::byte>
65 std::optional<std::vector<Byte>> TryParseHex(std::string_view str);
67 template <typename Byte = uint8_t>
68 std::vector<Byte> ParseHex(std::string_view hex_str)
69 {
70  return TryParseHex<Byte>(hex_str).value_or(std::vector<Byte>{});
71 }
72 /* Returns true if each character in str is a hex character, and has an even
73  * number of hex digits.*/
74 bool IsHex(std::string_view str);
75 std::optional<std::vector<unsigned char>> DecodeBase64(std::string_view str);
76 std::string EncodeBase64(Span<const unsigned char> input);
77 inline std::string EncodeBase64(Span<const std::byte> input) { return EncodeBase64(MakeUCharSpan(input)); }
78 inline std::string EncodeBase64(std::string_view str) { return EncodeBase64(MakeUCharSpan(str)); }
79 std::optional<std::vector<unsigned char>> DecodeBase32(std::string_view str);
80 
86 std::string EncodeBase32(Span<const unsigned char> input, bool pad = true);
87 
93 std::string EncodeBase32(std::string_view str, bool pad = true);
94 
104 bool SplitHostPort(std::string_view in, uint16_t& portOut, std::string& hostOut);
105 
106 // LocaleIndependentAtoi is provided for backwards compatibility reasons.
107 //
108 // New code should use ToIntegral or the ParseInt* functions
109 // which provide parse error feedback.
110 //
111 // The goal of LocaleIndependentAtoi is to replicate the defined behaviour of
112 // std::atoi as it behaves under the "C" locale, and remove some undefined
113 // behavior. If the parsed value is bigger than the integer type's maximum
114 // value, or smaller than the integer type's minimum value, std::atoi has
115 // undefined behavior, while this function returns the maximum or minimum
116 // values, respectively.
117 template <typename T>
118 T LocaleIndependentAtoi(std::string_view str)
119 {
120  static_assert(std::is_integral<T>::value);
121  T result;
122  // Emulate atoi(...) handling of white space and leading +/-.
123  std::string_view s = util::TrimStringView(str);
124  if (!s.empty() && s[0] == '+') {
125  if (s.length() >= 2 && s[1] == '-') {
126  return 0;
127  }
128  s = s.substr(1);
129  }
130  auto [_, error_condition] = std::from_chars(s.data(), s.data() + s.size(), result);
131  if (error_condition == std::errc::result_out_of_range) {
132  if (s.length() >= 1 && s[0] == '-') {
133  // Saturate underflow, per strtoll's behavior.
134  return std::numeric_limits<T>::min();
135  } else {
136  // Saturate overflow, per strtoll's behavior.
137  return std::numeric_limits<T>::max();
138  }
139  } else if (error_condition != std::errc{}) {
140  return 0;
141  }
142  return result;
143 }
144 
150 constexpr bool IsDigit(char c)
151 {
152  return c >= '0' && c <= '9';
153 }
154 
166 constexpr inline bool IsSpace(char c) noexcept {
167  return c == ' ' || c == '\f' || c == '\n' || c == '\r' || c == '\t' || c == '\v';
168 }
169 
178 template <typename T>
179 std::optional<T> ToIntegral(std::string_view str)
180 {
181  static_assert(std::is_integral<T>::value);
182  T result;
183  const auto [first_nonmatching, error_condition] = std::from_chars(str.data(), str.data() + str.size(), result);
184  if (first_nonmatching != str.data() + str.size() || error_condition != std::errc{}) {
185  return std::nullopt;
186  }
187  return result;
188 }
189 
195 [[nodiscard]] bool ParseInt32(std::string_view str, int32_t *out);
196 
202 [[nodiscard]] bool ParseInt64(std::string_view str, int64_t *out);
203 
209 [[nodiscard]] bool ParseUInt8(std::string_view str, uint8_t *out);
210 
216 [[nodiscard]] bool ParseUInt16(std::string_view str, uint16_t* out);
217 
223 [[nodiscard]] bool ParseUInt32(std::string_view str, uint32_t *out);
224 
230 [[nodiscard]] bool ParseUInt64(std::string_view str, uint64_t *out);
231 
236 std::string FormatParagraph(std::string_view in, size_t width = 79, size_t indent = 0);
237 
243 template <typename T>
244 bool TimingResistantEqual(const T& a, const T& b)
245 {
246  if (b.size() == 0) return a.size() == 0;
247  size_t accumulator = a.size() ^ b.size();
248  for (size_t i = 0; i < a.size(); i++)
249  accumulator |= size_t(a[i] ^ b[i%b.size()]);
250  return accumulator == 0;
251 }
252 
257 [[nodiscard]] bool ParseFixedPoint(std::string_view, int decimals, int64_t *amount_out);
258 
259 namespace {
261 struct IntIdentity
262 {
263  [[maybe_unused]] int operator()(int x) const { return x; }
264 };
265 
266 } // namespace
267 
269 template<int frombits, int tobits, bool pad, typename O, typename It, typename I = IntIdentity>
270 bool ConvertBits(O outfn, It it, It end, I infn = {}) {
271  size_t acc = 0;
272  size_t bits = 0;
273  constexpr size_t maxv = (1 << tobits) - 1;
274  constexpr size_t max_acc = (1 << (frombits + tobits - 1)) - 1;
275  while (it != end) {
276  int v = infn(*it);
277  if (v < 0) return false;
278  acc = ((acc << frombits) | v) & max_acc;
279  bits += frombits;
280  while (bits >= tobits) {
281  bits -= tobits;
282  outfn((acc >> bits) & maxv);
283  }
284  ++it;
285  }
286  if (pad) {
287  if (bits) outfn((acc << (tobits - bits)) & maxv);
288  } else if (bits >= frombits || ((acc << (tobits - bits)) & maxv)) {
289  return false;
290  }
291  return true;
292 }
293 
304 constexpr char ToLower(char c)
305 {
306  return (c >= 'A' && c <= 'Z' ? (c - 'A') + 'a' : c);
307 }
308 
318 std::string ToLower(std::string_view str);
319 
330 constexpr char ToUpper(char c)
331 {
332  return (c >= 'a' && c <= 'z' ? (c - 'a') + 'A' : c);
333 }
334 
344 std::string ToUpper(std::string_view str);
345 
355 std::string Capitalize(std::string str);
356 
368 std::optional<uint64_t> ParseByteUnits(std::string_view str, ByteUnit default_multiplier);
369 
370 namespace util {
372 consteval uint8_t ConstevalHexDigit(const char c)
373 {
374  if (c >= '0' && c <= '9') return c - '0';
375  if (c >= 'a' && c <= 'f') return c - 'a' + 0xa;
376 
377  throw "Only lowercase hex digits are allowed, for consistency";
378 }
379 
380 namespace detail {
381 template <size_t N>
382 struct Hex {
383  std::array<std::byte, N / 2> bytes{};
384  consteval Hex(const char (&hex_str)[N])
385  // 2 hex digits required per byte + implicit null terminator
386  requires(N % 2 == 1)
387  {
388  if (hex_str[N - 1]) throw "null terminator required";
389  for (std::size_t i = 0; i < bytes.size(); ++i) {
390  bytes[i] = static_cast<std::byte>(
391  (ConstevalHexDigit(hex_str[2 * i]) << 4) |
392  ConstevalHexDigit(hex_str[2 * i + 1]));
393  }
394  }
395 };
396 } // namespace detail
397 
427 inline namespace hex_literals {
428 
429 template <util::detail::Hex str>
430 constexpr auto operator""_hex() { return str.bytes; }
431 
432 template <util::detail::Hex str>
433 constexpr auto operator""_hex_u8() { return std::bit_cast<std::array<uint8_t, str.bytes.size()>>(str.bytes); }
434 
435 template <util::detail::Hex str>
436 constexpr auto operator""_hex_v() { return std::vector<std::byte>{str.bytes.begin(), str.bytes.end()}; }
437 
438 template <util::detail::Hex str>
439 inline auto operator""_hex_v_u8() { return std::vector<uint8_t>{UCharCast(str.bytes.data()), UCharCast(str.bytes.data() + str.bytes.size())}; }
440 
441 } // inline namespace hex_literals
442 } // namespace util
443 
444 #endif // BITCOIN_UTIL_STRENCODINGS_H
bool TimingResistantEqual(const T &a, const T &b)
Timing-attack-resistant comparison.
Definition: strencodings.h:244
The full set of allowed chars.
Definition: strencodings.h:32
constexpr char ToUpper(char c)
Converts the given character to its uppercase equivalent.
Definition: strencodings.h:330
T LocaleIndependentAtoi(std::string_view str)
Definition: strencodings.h:118
std::optional< uint64_t > ParseByteUnits(std::string_view str, ByteUnit default_multiplier)
Parse a string with suffix unit [k|K|m|M|g|G|t|T].
bool ParseUInt64(std::string_view str, uint64_t *out)
Convert decimal string to unsigned 64-bit integer with strict parse error feedback.
bool ParseUInt16(std::string_view str, uint16_t *out)
Convert decimal string to unsigned 16-bit integer with strict parse error feedback.
bool ParseFixedPoint(std::string_view, int decimals, int64_t *amount_out)
Parse number as fixed point according to JSON number syntax.
constexpr bool IsDigit(char c)
Tests if the given character is a decimal digit.
Definition: strencodings.h:150
bool ParseUInt32(std::string_view str, uint32_t *out)
Convert decimal string to unsigned 32-bit integer with strict parse error feedback.
consteval auto _(util::TranslatedLiteral str)
Definition: translation.h:79
bool ParseInt32(std::string_view str, int32_t *out)
Convert string to signed 32-bit integer with strict parse error feedback.
std::string_view TrimStringView(std::string_view str, std::string_view pattern=" \\\)
Definition: string.h:146
consteval uint8_t ConstevalHexDigit(const char c)
consteval version of HexDigit() without the lookup table.
Definition: strencodings.h:372
SafeChars
Utilities for converting data from/to strings.
Definition: strencodings.h:30
bool ParseUInt8(std::string_view str, uint8_t *out)
Convert decimal string to unsigned 8-bit integer with strict parse error feedback.
std::string Capitalize(std::string str)
Capitalizes the first character of the given string.
ByteUnit
Used by ParseByteUnits() Lowercase base 1000 Uppercase base 1024.
Definition: strencodings.h:43
Chars allowed in filenames.
Definition: strencodings.h:34
auto result
Definition: common-types.h:74
constexpr bool IsSpace(char c) noexcept
Tests if the given character is a whitespace character.
Definition: strencodings.h:166
std::optional< T > ToIntegral(std::string_view str)
Convert string to integral type T.
Definition: strencodings.h:179
unsigned char * UCharCast(char *c)
Definition: span.h:280
bool ParseInt64(std::string_view str, int64_t *out)
Convert string to signed 64-bit integer with strict parse error feedback.
constexpr char ToLower(char c)
Converts the given character to its lowercase equivalent.
Definition: strencodings.h:304
bool ConvertBits(O outfn, It it, It end, I infn={})
Convert from one power-of-2 number base to another.
Definition: strencodings.h:270
Chars allowed in URIs (RFC 3986)
Definition: strencodings.h:35
std::string FormatParagraph(std::string_view in, size_t width=79, size_t indent=0)
Format a paragraph of text to a fixed width, adding spaces for indentation to any added line...
BIP-0014 subset.
Definition: strencodings.h:33
std::array< std::byte, N/2 > bytes
Definition: strencodings.h:383