Bitcoin Core 28.0.0
P2P Digital Currency
Loading...
Searching...
No Matches
strencodings.h
Go to the documentation of this file.
1// Copyright (c) 2009-2010 Satoshi Nakamoto
2// Copyright (c) 2009-2022 The Bitcoin Core developers
3// Distributed under the MIT software license, see the accompanying
4// file COPYING or http://www.opensource.org/licenses/mit-license.php.
5
9#ifndef BITCOIN_UTIL_STRENCODINGS_H
10#define BITCOIN_UTIL_STRENCODINGS_H
11
12#include <crypto/hex_base.h> // IWYU pragma: export
13#include <span.h>
14#include <util/string.h>
15
16#include <charconv>
17#include <cstddef>
18#include <cstdint>
19#include <limits>
20#include <optional>
21#include <string> // IWYU pragma: export
22#include <string_view> // IWYU pragma: export
23#include <system_error>
24#include <type_traits>
25#include <vector>
26
35
41enum class ByteUnit : uint64_t {
42 NOOP = 1ULL,
43 k = 1000ULL,
44 K = 1024ULL,
45 m = 1'000'000ULL,
46 M = 1ULL << 20,
47 g = 1'000'000'000ULL,
48 G = 1ULL << 30,
49 t = 1'000'000'000'000ULL,
50 T = 1ULL << 40,
51};
52
60std::string SanitizeString(std::string_view str, int rule = SAFE_CHARS_DEFAULT);
62template <typename Byte = std::byte>
63std::optional<std::vector<Byte>> TryParseHex(std::string_view str);
65template <typename Byte = uint8_t>
66std::vector<Byte> ParseHex(std::string_view hex_str)
67{
68 return TryParseHex<Byte>(hex_str).value_or(std::vector<Byte>{});
69}
70/* Returns true if each character in str is a hex character, and has an even
71 * number of hex digits.*/
72bool IsHex(std::string_view str);
76bool IsHexNumber(std::string_view str);
77std::optional<std::vector<unsigned char>> DecodeBase64(std::string_view str);
79inline std::string EncodeBase64(Span<const std::byte> input) { return EncodeBase64(MakeUCharSpan(input)); }
80inline std::string EncodeBase64(std::string_view str) { return EncodeBase64(MakeUCharSpan(str)); }
81std::optional<std::vector<unsigned char>> DecodeBase32(std::string_view str);
82
88std::string EncodeBase32(Span<const unsigned char> input, bool pad = true);
89
95std::string EncodeBase32(std::string_view str, bool pad = true);
96
106bool SplitHostPort(std::string_view in, uint16_t& portOut, std::string& hostOut);
107
108// LocaleIndependentAtoi is provided for backwards compatibility reasons.
109//
110// New code should use ToIntegral or the ParseInt* functions
111// which provide parse error feedback.
112//
113// The goal of LocaleIndependentAtoi is to replicate the defined behaviour of
114// std::atoi as it behaves under the "C" locale, and remove some undefined
115// behavior. If the parsed value is bigger than the integer type's maximum
116// value, or smaller than the integer type's minimum value, std::atoi has
117// undefined behavior, while this function returns the maximum or minimum
118// values, respectively.
119template <typename T>
120T LocaleIndependentAtoi(std::string_view str)
121{
122 static_assert(std::is_integral<T>::value);
123 T result;
124 // Emulate atoi(...) handling of white space and leading +/-.
125 std::string_view s = util::TrimStringView(str);
126 if (!s.empty() && s[0] == '+') {
127 if (s.length() >= 2 && s[1] == '-') {
128 return 0;
129 }
130 s = s.substr(1);
131 }
132 auto [_, error_condition] = std::from_chars(s.data(), s.data() + s.size(), result);
133 if (error_condition == std::errc::result_out_of_range) {
134 if (s.length() >= 1 && s[0] == '-') {
135 // Saturate underflow, per strtoll's behavior.
136 return std::numeric_limits<T>::min();
137 } else {
138 // Saturate overflow, per strtoll's behavior.
139 return std::numeric_limits<T>::max();
140 }
141 } else if (error_condition != std::errc{}) {
142 return 0;
143 }
144 return result;
145}
146
152constexpr bool IsDigit(char c)
153{
154 return c >= '0' && c <= '9';
155}
156
168constexpr inline bool IsSpace(char c) noexcept {
169 return c == ' ' || c == '\f' || c == '\n' || c == '\r' || c == '\t' || c == '\v';
170}
171
180template <typename T>
181std::optional<T> ToIntegral(std::string_view str)
182{
183 static_assert(std::is_integral<T>::value);
184 T result;
185 const auto [first_nonmatching, error_condition] = std::from_chars(str.data(), str.data() + str.size(), result);
186 if (first_nonmatching != str.data() + str.size() || error_condition != std::errc{}) {
187 return std::nullopt;
188 }
189 return result;
190}
191
197[[nodiscard]] bool ParseInt32(std::string_view str, int32_t *out);
198
204[[nodiscard]] bool ParseInt64(std::string_view str, int64_t *out);
205
211[[nodiscard]] bool ParseUInt8(std::string_view str, uint8_t *out);
212
218[[nodiscard]] bool ParseUInt16(std::string_view str, uint16_t* out);
219
225[[nodiscard]] bool ParseUInt32(std::string_view str, uint32_t *out);
226
232[[nodiscard]] bool ParseUInt64(std::string_view str, uint64_t *out);
233
238std::string FormatParagraph(std::string_view in, size_t width = 79, size_t indent = 0);
239
245template <typename T>
246bool TimingResistantEqual(const T& a, const T& b)
247{
248 if (b.size() == 0) return a.size() == 0;
249 size_t accumulator = a.size() ^ b.size();
250 for (size_t i = 0; i < a.size(); i++)
251 accumulator |= size_t(a[i] ^ b[i%b.size()]);
252 return accumulator == 0;
253}
254
259[[nodiscard]] bool ParseFixedPoint(std::string_view, int decimals, int64_t *amount_out);
260
261namespace {
263struct IntIdentity
264{
265 [[maybe_unused]] int operator()(int x) const { return x; }
266};
267
268} // namespace
269
271template<int frombits, int tobits, bool pad, typename O, typename It, typename I = IntIdentity>
272bool ConvertBits(O outfn, It it, It end, I infn = {}) {
273 size_t acc = 0;
274 size_t bits = 0;
275 constexpr size_t maxv = (1 << tobits) - 1;
276 constexpr size_t max_acc = (1 << (frombits + tobits - 1)) - 1;
277 while (it != end) {
278 int v = infn(*it);
279 if (v < 0) return false;
280 acc = ((acc << frombits) | v) & max_acc;
281 bits += frombits;
282 while (bits >= tobits) {
283 bits -= tobits;
284 outfn((acc >> bits) & maxv);
285 }
286 ++it;
287 }
288 if (pad) {
289 if (bits) outfn((acc << (tobits - bits)) & maxv);
290 } else if (bits >= frombits || ((acc << (tobits - bits)) & maxv)) {
291 return false;
292 }
293 return true;
294}
295
306constexpr char ToLower(char c)
307{
308 return (c >= 'A' && c <= 'Z' ? (c - 'A') + 'a' : c);
309}
310
320std::string ToLower(std::string_view str);
321
332constexpr char ToUpper(char c)
333{
334 return (c >= 'a' && c <= 'z' ? (c - 'a') + 'A' : c);
335}
336
346std::string ToUpper(std::string_view str);
347
357std::string Capitalize(std::string str);
358
370std::optional<uint64_t> ParseByteUnits(std::string_view str, ByteUnit default_multiplier);
371
372#endif // BITCOIN_UTIL_STRENCODINGS_H
A Span is an object that can refer to a contiguous sequence of objects.
Definition span.h:98
std::string_view TrimStringView(std::string_view str, std::string_view pattern=" \f\n\r\t\v")
Definition string.h:69
constexpr auto MakeUCharSpan(V &&v) -> decltype(UCharSpanCast(Span{std::forward< V >(v)}))
Like the Span constructor, but for (const) unsigned char member types only.
Definition span.h:304
std::string EncodeBase32(Span< const unsigned char > input, bool pad=true)
Base32 encode.
std::string Capitalize(std::string str)
Capitalizes the first character of the given string.
bool IsHexNumber(std::string_view str)
Return true if the string is a hex number, optionally prefixed with "0x".
bool ParseInt32(std::string_view str, int32_t *out)
Convert string to signed 32-bit integer with strict parse error feedback.
bool ParseUInt16(std::string_view str, uint16_t *out)
Convert decimal string to unsigned 16-bit integer with strict parse error feedback.
constexpr char ToLower(char c)
Converts the given character to its lowercase equivalent.
constexpr bool IsDigit(char c)
Tests if the given character is a decimal digit.
std::string EncodeBase64(Span< const unsigned char > input)
constexpr char ToUpper(char c)
Converts the given character to its uppercase equivalent.
std::optional< std::vector< unsigned char > > DecodeBase32(std::string_view str)
T LocaleIndependentAtoi(std::string_view str)
bool ParseInt64(std::string_view str, int64_t *out)
Convert string to signed 64-bit integer with strict parse error feedback.
ByteUnit
Used by ParseByteUnits() Lowercase base 1000 Uppercase base 1024.
bool TimingResistantEqual(const T &a, const T &b)
Timing-attack-resistant comparison.
bool ParseUInt8(std::string_view str, uint8_t *out)
Convert decimal string to unsigned 8-bit integer with strict parse error feedback.
std::vector< Byte > ParseHex(std::string_view hex_str)
Like TryParseHex, but returns an empty vector on invalid input.
bool ParseFixedPoint(std::string_view, int decimals, int64_t *amount_out)
Parse number as fixed point according to JSON number syntax.
bool ParseUInt64(std::string_view str, uint64_t *out)
Convert decimal string to unsigned 64-bit integer with strict parse error feedback.
constexpr bool IsSpace(char c) noexcept
Tests if the given character is a whitespace character.
bool IsHex(std::string_view str)
std::optional< std::vector< unsigned char > > DecodeBase64(std::string_view str)
std::optional< T > ToIntegral(std::string_view str)
Convert string to integral type T.
bool SplitHostPort(std::string_view in, uint16_t &portOut, std::string &hostOut)
Splits socket address string into host string and port value.
bool ParseUInt32(std::string_view str, uint32_t *out)
Convert decimal string to unsigned 32-bit integer with strict parse error feedback.
bool ConvertBits(O outfn, It it, It end, I infn={})
Convert from one power-of-2 number base to another.
std::string FormatParagraph(std::string_view in, size_t width=79, size_t indent=0)
Format a paragraph of text to a fixed width, adding spaces for indentation to any added line.
std::string SanitizeString(std::string_view str, int rule=SAFE_CHARS_DEFAULT)
Remove unsafe chars.
std::optional< std::vector< Byte > > TryParseHex(std::string_view str)
Parse the hex string into bytes (uint8_t or std::byte).
std::optional< uint64_t > ParseByteUnits(std::string_view str, ByteUnit default_multiplier)
Parse a string with suffix unit [k|K|m|M|g|G|t|T].
SafeChars
Utilities for converting data from/to strings.
@ SAFE_CHARS_DEFAULT
The full set of allowed chars.
@ SAFE_CHARS_UA_COMMENT
BIP-0014 subset.
@ SAFE_CHARS_URI
Chars allowed in URIs (RFC 3986)
@ SAFE_CHARS_FILENAME
Chars allowed in filenames.
bilingual_str _(ConstevalStringLiteral str)
Translation function.
Definition translation.h:80