Bitcoin Core 31.99.0
P2P Digital Currency
util_string_tests.cpp
Go to the documentation of this file.
1// Copyright (c) 2024-present The Bitcoin Core developers
2// Distributed under the MIT software license, see the accompanying
3// file COPYING or http://www.opensource.org/licenses/mit-license.php.
4
5#include <util/strencodings.h>
6#include <util/string.h>
7#include <vector>
8
9#include <boost/test/unit_test.hpp>
10#include <test/util/common.h>
11#include <tinyformat.h>
12
13using namespace util;
15
16BOOST_AUTO_TEST_SUITE(util_string_tests)
17
18template <unsigned NumArgs>
19void TfmFormatZeroes(const std::string& fmt)
20{
21 std::apply([&](auto... args) {
22 (void)tfm::format(tfm::RuntimeFormat{fmt}, args...);
23 }, std::array<int, NumArgs>{});
24}
25
26// Helper to allow compile-time sanity checks while providing the number of
27// args directly. Normally PassFmt<sizeof...(Args)> would be used.
28template <unsigned NumArgs>
30{
31 // Execute compile-time check again at run-time to get code coverage stats
32 BOOST_CHECK_NO_THROW(CheckNumFormatSpecifiers<NumArgs>(fmt.fmt));
33
34 // If ConstevalFormatString didn't throw above, make sure tinyformat doesn't
35 // throw either for the same format string and parameter count combination.
36 // Proves that we have some extent of protection from runtime errors
37 // (tinyformat may still throw for some type mismatches).
38 BOOST_CHECK_NO_THROW(TfmFormatZeroes<NumArgs>(fmt.fmt));
39}
40template <unsigned WrongNumArgs>
41void FailFmtWithError(const char* wrong_fmt, std::string_view error)
42{
43 BOOST_CHECK_EXCEPTION(CheckNumFormatSpecifiers<WrongNumArgs>(wrong_fmt), const char*, HasReason{error});
44}
45
46std::vector<std::byte> StringToBuffer(const std::string& str)
47{
48 auto span = std::as_bytes(std::span(str));
49 return {span.begin(), span.end()};
50}
51
52BOOST_AUTO_TEST_CASE(ConstevalFormatString_NumSpec)
53{
54 PassFmt<0>("");
55 PassFmt<0>("%%");
56 PassFmt<1>("%s");
57 PassFmt<1>("%c");
58 PassFmt<0>("%%s");
59 PassFmt<0>("s%%");
60 PassFmt<1>("%%%s");
61 PassFmt<1>("%s%%");
62 PassFmt<0>(" 1$s");
63 PassFmt<1>("%1$s");
64 PassFmt<1>("%1$s%1$s");
65 PassFmt<2>("%2$s");
66 PassFmt<2>("%2$s 4$s %2$s");
67 PassFmt<129>("%129$s 999$s %2$s");
68 PassFmt<1>("%02d");
69 PassFmt<1>("%+2s");
70 PassFmt<1>("%.6i");
71 PassFmt<1>("%5.2f");
72 PassFmt<1>("%5.f");
73 PassFmt<1>("%.f");
74 PassFmt<1>("%#x");
75 PassFmt<1>("%1$5i");
76 PassFmt<1>("%1$-5i");
77 PassFmt<1>("%1$.5i");
78 // tinyformat accepts almost any "type" spec, even '%', or '_', or '\n'.
79 PassFmt<1>("%123%");
80 PassFmt<1>("%123%s");
81 PassFmt<1>("%_");
82 PassFmt<1>("%\n");
83
84 PassFmt<2>("%*c");
85 PassFmt<2>("%+*c");
86 PassFmt<2>("%.*f");
87 PassFmt<3>("%*.*f");
88 PassFmt<3>("%2$*3$d");
89 PassFmt<3>("%2$*3$.9d");
90 PassFmt<3>("%2$.*3$d");
91 PassFmt<3>("%2$9.*3$d");
92 PassFmt<3>("%2$+9.*3$d");
93 PassFmt<4>("%3$*2$.*4$f");
94
95 // Make sure multiple flag characters "- 0+" are accepted
96 PassFmt<3>("'%- 0+*.*f'");
97 PassFmt<3>("'%1$- 0+*3$.*2$f'");
98
99 auto err_mix{"Format specifiers must be all positional or all non-positional!"};
100 FailFmtWithError<1>("%s%1$s", err_mix);
101 FailFmtWithError<2>("%2$*d", err_mix);
102 FailFmtWithError<2>("%*2$d", err_mix);
103 FailFmtWithError<2>("%.*3$d", err_mix);
104 FailFmtWithError<2>("%2$.*d", err_mix);
105
106 auto err_num{"Format specifier count must match the argument count!"};
107 FailFmtWithError<1>("", err_num);
108 FailFmtWithError<0>("%s", err_num);
109 FailFmtWithError<2>("%s", err_num);
110 FailFmtWithError<0>("%1$s", err_num);
111 FailFmtWithError<2>("%1$s", err_num);
112 FailFmtWithError<1>("%*c", err_num);
113
114 auto err_0_pos{"Positional format specifier must have position of at least 1"};
115 FailFmtWithError<1>("%$s", err_0_pos);
116 FailFmtWithError<1>("%$", err_0_pos);
117 FailFmtWithError<0>("%0$", err_0_pos);
118 FailFmtWithError<0>("%0$s", err_0_pos);
119 FailFmtWithError<2>("%2$*$d", err_0_pos);
120 FailFmtWithError<2>("%2$*0$d", err_0_pos);
121 FailFmtWithError<3>("%3$*2$.*$f", err_0_pos);
122 FailFmtWithError<3>("%3$*2$.*0$f", err_0_pos);
123
124 auto err_term{"Format specifier incorrectly terminated by end of string"};
125 FailFmtWithError<1>("%", err_term);
126 FailFmtWithError<1>("%9", err_term);
127 FailFmtWithError<1>("%9.", err_term);
128 FailFmtWithError<1>("%9.9", err_term);
129 FailFmtWithError<1>("%*", err_term);
130 FailFmtWithError<1>("%+*", err_term);
131 FailFmtWithError<1>("%.*", err_term);
132 FailFmtWithError<1>("%9.*", err_term);
133 FailFmtWithError<1>("%1$", err_term);
134 FailFmtWithError<1>("%1$9", err_term);
135 FailFmtWithError<2>("%1$*2$", err_term);
136 FailFmtWithError<2>("%1$.*2$", err_term);
137 FailFmtWithError<2>("%1$9.*2$", err_term);
138
139 // Non-parity between tinyformat and ConstevalFormatString.
140 // tinyformat throws but ConstevalFormatString does not.
141 BOOST_CHECK_EXCEPTION(tfm::format(ConstevalFormatString<1>{"%n"}, 0), tfm::format_error,
142 HasReason{"tinyformat: %n conversion spec not supported"});
143 BOOST_CHECK_EXCEPTION(tfm::format(ConstevalFormatString<2>{"%*s"}, "hi", "hi"), tfm::format_error,
144 HasReason{"tinyformat: Cannot convert from argument type to integer for use as variable width or precision"});
145 BOOST_CHECK_EXCEPTION(tfm::format(ConstevalFormatString<2>{"%.*s"}, "hi", "hi"), tfm::format_error,
146 HasReason{"tinyformat: Cannot convert from argument type to integer for use as variable width or precision"});
147
148 // Ensure that tinyformat throws if format string contains wrong number
149 // of specifiers. PassFmt relies on this to verify tinyformat successfully
150 // formats the strings, and will need to be updated if tinyformat is changed
151 // not to throw on failure.
152 BOOST_CHECK_EXCEPTION(TfmFormatZeroes<2>("%s"), tfm::format_error,
153 HasReason{"tinyformat: Not enough conversion specifiers in format string"});
154 BOOST_CHECK_EXCEPTION(TfmFormatZeroes<1>("%s %s"), tfm::format_error,
155 HasReason{"tinyformat: Too many conversion specifiers in format string"});
156}
157
158BOOST_AUTO_TEST_CASE(ascii_case_insensitive_key_equal_test)
159{
161 BOOST_CHECK(!cmp("A", "B"));
162 BOOST_CHECK(!cmp("A", "b"));
163 BOOST_CHECK(!cmp("a", "B"));
164 BOOST_CHECK(!cmp("B", "A"));
165 BOOST_CHECK(!cmp("B", "a"));
166 BOOST_CHECK(!cmp("b", "A"));
167 BOOST_CHECK(!cmp("A", "AA"));
168 BOOST_CHECK(cmp("A-A", "a-a"));
169 BOOST_CHECK(cmp("A", "A"));
170 BOOST_CHECK(cmp("A", "a"));
171 BOOST_CHECK(cmp("a", "a"));
172 BOOST_CHECK(cmp("B", "b"));
173 BOOST_CHECK(cmp("ab", "aB"));
174 BOOST_CHECK(cmp("Ab", "aB"));
175 BOOST_CHECK(cmp("AB", "ab"));
176
177 // Use a character with value > 127
178 // to ensure we don't trigger implicit-integer-sign-change
179 BOOST_CHECK(!cmp("a", "\xe4"));
180}
181
182BOOST_AUTO_TEST_CASE(ascii_case_insensitive_hash_test)
183{
185 BOOST_CHECK_NE(hsh("A"), hsh("B"));
186 BOOST_CHECK_NE(hsh("AA"), hsh("A"));
187 BOOST_CHECK_EQUAL(hsh("A"), hsh("a"));
188 BOOST_CHECK_EQUAL(hsh("Ab"), hsh("aB"));
189 BOOST_CHECK_EQUAL(hsh("A\xfe"), hsh("a\xfe"));
190}
191
192BOOST_AUTO_TEST_CASE(line_reader_test)
193{
194 {
195 // Check three lines terminated by \n and \r\n, trimming whitespace
196 const std::vector<std::byte> input{StringToBuffer("once upon a time\n there was a dog \r\nwho liked food\n")};
197 LineReader reader(input, /*max_line_length=*/128);
198 std::optional<std::string> line1{reader.ReadLine()};
199 BOOST_CHECK_EQUAL(reader.Remaining(), 34);
200 std::optional<std::string> line2{reader.ReadLine()};
201 BOOST_CHECK_EQUAL(reader.Remaining(), 15);
202 std::optional<std::string> line3{reader.ReadLine()};
203 std::optional<std::string> line4{reader.ReadLine()};
204 BOOST_CHECK(line1);
205 BOOST_CHECK(line2);
206 BOOST_CHECK(line3);
207 BOOST_CHECK(!line4);
208 BOOST_CHECK_EQUAL(line1.value(), "once upon a time");
209 BOOST_CHECK_EQUAL(line2.value(), "there was a dog");
210 BOOST_CHECK_EQUAL(line3.value(), "who liked food");
211 }
212 {
213 // Do not exceed max_line_length + 1 while searching for \n
214 // Test with 22-character line + \n + 23-character line + \n
215 const std::vector<std::byte> input{StringToBuffer("once upon a time there\nwas a dog who liked tea\n")};
216
217 LineReader reader1(input, /*max_line_length=*/22);
218 // First line is exactly the length of max_line_length
219 BOOST_CHECK_EQUAL(reader1.ReadLine(), "once upon a time there");
220 // Second line is +1 character too long
221 BOOST_CHECK_EXCEPTION(reader1.ReadLine(), std::runtime_error, HasReason{"max_line_length exceeded by LineReader"});
222
223 // Increase max_line_length by 1
224 LineReader reader2(input, /*max_line_length=*/23);
225 // Both lines fit within limit
226 BOOST_CHECK_EQUAL(reader2.ReadLine(), "once upon a time there");
227 BOOST_CHECK_EQUAL(reader2.ReadLine(), "was a dog who liked tea");
228 // End of buffer reached
229 BOOST_CHECK(!reader2.ReadLine());
230 }
231 {
232 // Empty lines are empty
233 const std::vector<std::byte> input{StringToBuffer("\n")};
234 LineReader reader(input, /*max_line_length=*/1024);
235 BOOST_CHECK_EQUAL(reader.ReadLine(), "");
236 BOOST_CHECK(!reader.ReadLine());
237 }
238 {
239 // Empty buffers are null
240 const std::vector<std::byte> input{StringToBuffer("")};
241 LineReader reader(input, /*max_line_length=*/1024);
242 BOOST_CHECK(!reader.ReadLine());
243 }
244 {
245 // Even one character is too long, if it's not \n
246 const std::vector<std::byte> input{StringToBuffer("ab\n")};
247 LineReader reader(input, /*max_line_length=*/1);
248 // First line is +1 character too long
249 BOOST_CHECK_EXCEPTION(reader.ReadLine(), std::runtime_error, HasReason{"max_line_length exceeded by LineReader"});
250 }
251 {
252 const std::vector<std::byte> input{StringToBuffer("a\nb\n")};
253 LineReader reader(input, /*max_line_length=*/1);
254 BOOST_CHECK_EQUAL(reader.ReadLine(), "a");
255 BOOST_CHECK_EQUAL(reader.ReadLine(), "b");
256 BOOST_CHECK(!reader.ReadLine());
257 }
258 {
259 // If ReadLine fails, the iterator is reset and we can ReadLength instead
260 const std::vector<std::byte> input{StringToBuffer("a\nbaboon\n")};
261 LineReader reader(input, /*max_line_length=*/1);
262 BOOST_CHECK_EQUAL(reader.ReadLine(), "a");
263 // "baboon" is too long
264 BOOST_CHECK_EXCEPTION(reader.ReadLine(), std::runtime_error, HasReason{"max_line_length exceeded by LineReader"});
265 BOOST_CHECK_EQUAL(reader.ReadLength(1), "b");
266 BOOST_CHECK_EQUAL(reader.ReadLength(1), "a");
267 BOOST_CHECK_EQUAL(reader.ReadLength(2), "bo");
268 // "on" is too long
269 BOOST_CHECK_EXCEPTION(reader.ReadLine(), std::runtime_error, HasReason{"max_line_length exceeded by LineReader"});
270 BOOST_CHECK_EQUAL(reader.ReadLength(1), "o");
271 BOOST_CHECK_EQUAL(reader.ReadLine(), "n"); // now the remainder of the buffer fits in one line
272 BOOST_CHECK(!reader.ReadLine());
273 }
274 {
275 // The end of the buffer (EOB) does not count as end of line \n
276 const std::vector<std::byte> input{StringToBuffer("once upon a time there")};
277
278 LineReader reader(input, /*max_line_length=*/22);
279 // First line is exactly the length of max_line_length, but that doesn't matter because \n is missing
280 BOOST_CHECK(!reader.ReadLine());
281 // Data can still be read using ReadLength
282 BOOST_CHECK_EQUAL(reader.ReadLength(22), "once upon a time there");
283 // End of buffer reached
284 BOOST_CHECK_EQUAL(reader.Remaining(), 0);
285 }
286 {
287 // Read specific number of bytes regardless of max_line_length or \n unless buffer is too short
288 const std::vector<std::byte> input{StringToBuffer("once upon a time\n there was a dog \r\nwho liked food")};
289 LineReader reader(input, /*max_line_length=*/1);
290 BOOST_CHECK_EQUAL(reader.ReadLength(0), "");
291 BOOST_CHECK_EQUAL(reader.ReadLength(3), "onc");
292 BOOST_CHECK_EQUAL(reader.ReadLength(8), "e upon a");
293 BOOST_CHECK_EQUAL(reader.ReadLength(8), " time\n t");
294 BOOST_CHECK_EXCEPTION(reader.ReadLength(128), std::runtime_error, HasReason{"Not enough data in buffer"});
295 // After the error the iterator is reset so we can try again
296 BOOST_CHECK_EQUAL(reader.ReadLength(31), "here was a dog \r\nwho liked food");
297 // End of buffer reached
298 BOOST_CHECK_EQUAL(reader.Remaining(), 0);
299 }
300}
301
ArgsManager & args
Definition: bitcoind.cpp:277
BOOST_CHECK_EXCEPTION predicates to check the specific validation error.
Definition: common.h:18
BOOST_AUTO_TEST_SUITE_END()
void format(std::ostream &out, FormatStringCheck< sizeof...(Args)> fmt, const Args &... args)
Format list of arguments to the stream according to given format string.
Definition: tinyformat.h:1079
static constexpr void CheckNumFormatSpecifiers(const char *str)
Definition: string.h:23
#define BOOST_CHECK_EQUAL(v1, v2)
Definition: object.cpp:17
#define BOOST_CHECK_NO_THROW(stmt)
Definition: object.cpp:27
#define BOOST_CHECK(expr)
Definition: object.cpp:16
A wrapper for a compile-time partially validated format string.
Definition: string.h:93
const char *const fmt
Definition: string.h:94
size_t Remaining() const
Returns remaining size of bytes in buffer.
Definition: string.cpp:66
std::string ReadLength(size_t len)
Returns string from current iterator position of specified length if possible and advances iterator o...
Definition: string.cpp:57
std::optional< std::string > ReadLine()
Returns a string from current iterator position up to (but not including) next and advances iterator...
Definition: string.cpp:20
BOOST_AUTO_TEST_CASE(ConstevalFormatString_NumSpec)
void TfmFormatZeroes(const std::string &fmt)
std::vector< std::byte > StringToBuffer(const std::string &str)
void PassFmt(ConstevalFormatString< NumArgs > fmt)
void FailFmtWithError(const char *wrong_fmt, std::string_view error)