Bitcoin Core 28.99.0
P2P Digital Currency
streams.h
Go to the documentation of this file.
1// Copyright (c) 2009-2010 Satoshi Nakamoto
2// Copyright (c) 2009-2022 The Bitcoin Core developers
3// Distributed under the MIT software license, see the accompanying
4// file COPYING or http://www.opensource.org/licenses/mit-license.php.
5
6#ifndef BITCOIN_STREAMS_H
7#define BITCOIN_STREAMS_H
8
9#include <serialize.h>
10#include <span.h>
12#include <util/overflow.h>
13
14#include <algorithm>
15#include <assert.h>
16#include <cstddef>
17#include <cstdio>
18#include <ios>
19#include <limits>
20#include <optional>
21#include <stdint.h>
22#include <string.h>
23#include <string>
24#include <utility>
25#include <vector>
26
27namespace util {
28inline void Xor(Span<std::byte> write, Span<const std::byte> key, size_t key_offset = 0)
29{
30 if (key.size() == 0) {
31 return;
32 }
33 key_offset %= key.size();
34
35 for (size_t i = 0, j = key_offset; i != write.size(); i++) {
36 write[i] ^= key[j++];
37
38 // This potentially acts on very many bytes of data, so it's
39 // important that we calculate `j`, i.e. the `key` index in this
40 // way instead of doing a %, which would effectively be a division
41 // for each byte Xor'd -- much slower than need be.
42 if (j == key.size())
43 j = 0;
44 }
45}
46} // namespace util
47
48/* Minimal stream for overwriting and/or appending to an existing byte vector
49 *
50 * The referenced vector will grow as necessary
51 */
53{
54public:
55/*
56 * @param[in] vchDataIn Referenced byte vector to overwrite/append
57 * @param[in] nPosIn Starting position. Vector index where writes should start. The vector will initially
58 * grow as necessary to max(nPosIn, vec.size()). So to append, use vec.size().
59*/
60 VectorWriter(std::vector<unsigned char>& vchDataIn, size_t nPosIn) : vchData{vchDataIn}, nPos{nPosIn}
61 {
62 if(nPos > vchData.size())
63 vchData.resize(nPos);
64 }
65/*
66 * (other params same as above)
67 * @param[in] args A list of items to serialize starting at nPosIn.
68*/
69 template <typename... Args>
70 VectorWriter(std::vector<unsigned char>& vchDataIn, size_t nPosIn, Args&&... args) : VectorWriter{vchDataIn, nPosIn}
71 {
72 ::SerializeMany(*this, std::forward<Args>(args)...);
73 }
75 {
76 assert(nPos <= vchData.size());
77 size_t nOverwrite = std::min(src.size(), vchData.size() - nPos);
78 if (nOverwrite) {
79 memcpy(vchData.data() + nPos, src.data(), nOverwrite);
80 }
81 if (nOverwrite < src.size()) {
82 vchData.insert(vchData.end(), UCharCast(src.data()) + nOverwrite, UCharCast(src.data() + src.size()));
83 }
84 nPos += src.size();
85 }
86 template <typename T>
88 {
89 ::Serialize(*this, obj);
90 return (*this);
91 }
92
93private:
94 std::vector<unsigned char>& vchData;
95 size_t nPos;
96};
97
101{
102private:
104
105public:
110
111 template<typename T>
113 {
114 ::Unserialize(*this, obj);
115 return (*this);
116 }
117
118 size_t size() const { return m_data.size(); }
119 bool empty() const { return m_data.empty(); }
120
122 {
123 if (dst.size() == 0) {
124 return;
125 }
126
127 // Read from the beginning of the buffer
128 if (dst.size() > m_data.size()) {
129 throw std::ios_base::failure("SpanReader::read(): end of data");
130 }
131 memcpy(dst.data(), m_data.data(), dst.size());
132 m_data = m_data.subspan(dst.size());
133 }
134
135 void ignore(size_t n)
136 {
137 m_data = m_data.subspan(n);
138 }
139};
140
147{
148protected:
151 vector_type::size_type m_read_pos{0};
152
153public:
154 typedef vector_type::allocator_type allocator_type;
155 typedef vector_type::size_type size_type;
156 typedef vector_type::difference_type difference_type;
157 typedef vector_type::reference reference;
158 typedef vector_type::const_reference const_reference;
159 typedef vector_type::value_type value_type;
160 typedef vector_type::iterator iterator;
161 typedef vector_type::const_iterator const_iterator;
162 typedef vector_type::reverse_iterator reverse_iterator;
163
164 explicit DataStream() = default;
166 explicit DataStream(Span<const value_type> sp) : vch(sp.data(), sp.data() + sp.size()) {}
167
168 std::string str() const
169 {
170 return std::string{UCharCast(data()), UCharCast(data() + size())};
171 }
172
173
174 //
175 // Vector subset
176 //
177 const_iterator begin() const { return vch.begin() + m_read_pos; }
178 iterator begin() { return vch.begin() + m_read_pos; }
179 const_iterator end() const { return vch.end(); }
180 iterator end() { return vch.end(); }
181 size_type size() const { return vch.size() - m_read_pos; }
182 bool empty() const { return vch.size() == m_read_pos; }
183 void resize(size_type n, value_type c = value_type{}) { vch.resize(n + m_read_pos, c); }
184 void reserve(size_type n) { vch.reserve(n + m_read_pos); }
185 const_reference operator[](size_type pos) const { return vch[pos + m_read_pos]; }
187 void clear() { vch.clear(); m_read_pos = 0; }
188 value_type* data() { return vch.data() + m_read_pos; }
189 const value_type* data() const { return vch.data() + m_read_pos; }
190
191 inline void Compact()
192 {
193 vch.erase(vch.begin(), vch.begin() + m_read_pos);
194 m_read_pos = 0;
195 }
196
197 bool Rewind(std::optional<size_type> n = std::nullopt)
198 {
199 // Total rewind if no size is passed
200 if (!n) {
201 m_read_pos = 0;
202 return true;
203 }
204 // Rewind by n characters if the buffer hasn't been compacted yet
205 if (*n > m_read_pos)
206 return false;
207 m_read_pos -= *n;
208 return true;
209 }
210
211
212 //
213 // Stream subset
214 //
215 bool eof() const { return size() == 0; }
216 int in_avail() const { return size(); }
217
219 {
220 if (dst.size() == 0) return;
221
222 // Read from the beginning of the buffer
223 auto next_read_pos{CheckedAdd(m_read_pos, dst.size())};
224 if (!next_read_pos.has_value() || next_read_pos.value() > vch.size()) {
225 throw std::ios_base::failure("DataStream::read(): end of data");
226 }
227 memcpy(dst.data(), &vch[m_read_pos], dst.size());
228 if (next_read_pos.value() == vch.size()) {
229 m_read_pos = 0;
230 vch.clear();
231 return;
232 }
233 m_read_pos = next_read_pos.value();
234 }
235
236 void ignore(size_t num_ignore)
237 {
238 // Ignore from the beginning of the buffer
239 auto next_read_pos{CheckedAdd(m_read_pos, num_ignore)};
240 if (!next_read_pos.has_value() || next_read_pos.value() > vch.size()) {
241 throw std::ios_base::failure("DataStream::ignore(): end of data");
242 }
243 if (next_read_pos.value() == vch.size()) {
244 m_read_pos = 0;
245 vch.clear();
246 return;
247 }
248 m_read_pos = next_read_pos.value();
249 }
250
252 {
253 // Write to the end of the buffer
254 vch.insert(vch.end(), src.begin(), src.end());
255 }
256
257 template<typename T>
259 {
260 ::Serialize(*this, obj);
261 return (*this);
262 }
263
264 template<typename T>
266 {
267 ::Unserialize(*this, obj);
268 return (*this);
269 }
270
276 void Xor(const std::vector<unsigned char>& key)
277 {
279 }
280
282 size_t GetMemoryUsage() const noexcept;
283};
284
/**
 * Reads values bit by bit, most significant bit first, from a byte stream.
 *
 * @tparam IStream  Stream type; only `istream >> uint8_t&` is required, which
 *                  must store the next byte of input into its argument.
 */
template <typename IStream>
class BitStreamReader
{
private:
    IStream& m_istream;

    //! Most recent byte fetched from m_istream. It is refilled once
    //! m_offset reaches 8.
    uint8_t m_buffer{0};

    //! Number of high-order bits of m_buffer already handed out by Read().
    //! Starts at 8 so that the first Read() fetches a byte.
    int m_offset{8};

public:
    explicit BitStreamReader(IStream& istream) : m_istream(istream) {}

    /**
     * Read the specified number of bits from the stream.
     *
     * @param[in] nbits  Number of bits to read, in the range [0, 64].
     * @return The bits read, placed in the nbits least significant bits of
     *         the result (0 when nbits is 0).
     * @throws std::out_of_range if nbits is outside [0, 64].
     */
    uint64_t Read(int nbits) {
        if (nbits < 0 || nbits > 64) {
            throw std::out_of_range("nbits must be between 0 and 64");
        }

        uint64_t data = 0;
        while (nbits > 0) {
            // Current byte fully consumed: fetch the next one.
            if (m_offset == 8) {
                m_istream >> m_buffer;
                m_offset = 0;
            }

            // Take as many bits as the current byte still holds, capped by
            // what the caller still needs.
            int bits = std::min(8 - m_offset, nbits);
            data <<= bits;
            // Shift the consumed bits out on the left (truncating back to
            // 8 bits), then right-align the `bits` wanted ones.
            data |= static_cast<uint8_t>(m_buffer << m_offset) >> (8 - bits);
            m_offset += bits;
            nbits -= bits;
        }
        return data;
    }
};
327
/**
 * Writes values bit by bit, most significant bit first, to a byte stream.
 *
 * @tparam OStream  Stream type; only `ostream << uint8_t` is required, which
 *                  must append the given byte to the output.
 */
template <typename OStream>
class BitStreamWriter
{
private:
    OStream& m_ostream;

    //! Byte being assembled; written out as soon as it is full, or on an
    //! explicit Flush().
    uint8_t m_buffer{0};

    //! Number of high-order bits of m_buffer already filled by Write().
    int m_offset{0};

public:
    explicit BitStreamWriter(OStream& ostream) : m_ostream(ostream) {}

    //! Emits any partially filled byte before the writer goes away.
    ~BitStreamWriter()
    {
        Flush();
    }

    /**
     * Write the nbits least significant bits of a 64-bit int to the output
     * stream.
     *
     * @param[in] data   Value whose low nbits bits are written.
     * @param[in] nbits  Number of bits to write, in the range [0, 64].
     * @throws std::out_of_range if nbits is outside [0, 64].
     */
    void Write(uint64_t data, int nbits) {
        if (nbits < 0 || nbits > 64) {
            throw std::out_of_range("nbits must be between 0 and 64");
        }

        while (nbits > 0) {
            int bits = std::min(8 - m_offset, nbits);
            // Left-align the nbits still to be written (dropping higher
            // bits), then shift right so they start at bit position m_offset
            // of the byte; the narrowing to uint8_t keeps only that byte.
            m_buffer |= (data << (64 - nbits)) >> (64 - 8 + m_offset);
            m_offset += bits;
            nbits -= bits;

            if (m_offset == 8) {
                Flush();
            }
        }
    }

    /**
     * Flush any unwritten bits to the output stream, padding with 0's to the
     * next byte boundary. Does nothing when no bits are pending.
     */
    void Flush() {
        if (m_offset == 0) {
            return;
        }

        m_ostream << m_buffer;
        m_buffer = 0;
        m_offset = 0;
    }
};
384
392{
393protected:
394 std::FILE* m_file;
395 std::vector<std::byte> m_xor;
396 std::optional<int64_t> m_position;
397
398public:
399 explicit AutoFile(std::FILE* file, std::vector<std::byte> data_xor={});
400
401 ~AutoFile() { fclose(); }
402
403 // Disallow copies
404 AutoFile(const AutoFile&) = delete;
405 AutoFile& operator=(const AutoFile&) = delete;
406
407 bool feof() const { return std::feof(m_file); }
408
409 int fclose()
410 {
411 if (auto rel{release()}) return std::fclose(rel);
412 return 0;
413 }
414
419 std::FILE* release()
420 {
421 std::FILE* ret{m_file};
422 m_file = nullptr;
423 return ret;
424 }
425
428 bool IsNull() const { return m_file == nullptr; }
429
431 void SetXor(std::vector<std::byte> data_xor) { m_xor = data_xor; }
432
434 std::size_t detail_fread(Span<std::byte> dst);
435
437 void seek(int64_t offset, int origin);
438
440 int64_t tell();
441
443 bool Commit();
444
446 bool Truncate(unsigned size);
447
448 //
449 // Stream subset
450 //
451 void read(Span<std::byte> dst);
452 void ignore(size_t nSize);
454
455 template <typename T>
456 AutoFile& operator<<(const T& obj)
457 {
458 ::Serialize(*this, obj);
459 return *this;
460 }
461
462 template <typename T>
464 {
465 ::Unserialize(*this, obj);
466 return *this;
467 }
468};
469
477{
478private:
480 uint64_t nSrcPos{0};
481 uint64_t m_read_pos{0};
482 uint64_t nReadLimit;
483 uint64_t nRewind;
484 std::vector<std::byte> vchBuf;
485
487 bool Fill() {
488 unsigned int pos = nSrcPos % vchBuf.size();
489 unsigned int readNow = vchBuf.size() - pos;
490 unsigned int nAvail = vchBuf.size() - (nSrcPos - m_read_pos) - nRewind;
491 if (nAvail < readNow)
492 readNow = nAvail;
493 if (readNow == 0)
494 return false;
495 size_t nBytes{m_src.detail_fread(Span{vchBuf}.subspan(pos, readNow))};
496 if (nBytes == 0) {
497 throw std::ios_base::failure{m_src.feof() ? "BufferedFile::Fill: end of file" : "BufferedFile::Fill: fread failed"};
498 }
499 nSrcPos += nBytes;
500 return true;
501 }
502
508 std::pair<std::byte*, size_t> AdvanceStream(size_t length)
509 {
510 assert(m_read_pos <= nSrcPos);
511 if (m_read_pos + length > nReadLimit) {
512 throw std::ios_base::failure("Attempt to position past buffer limit");
513 }
514 // If there are no bytes available, read from the file.
515 if (m_read_pos == nSrcPos && length > 0) Fill();
516
517 size_t buffer_offset{static_cast<size_t>(m_read_pos % vchBuf.size())};
518 size_t buffer_available{static_cast<size_t>(vchBuf.size() - buffer_offset)};
519 size_t bytes_until_source_pos{static_cast<size_t>(nSrcPos - m_read_pos)};
520 size_t advance{std::min({length, buffer_available, bytes_until_source_pos})};
521 m_read_pos += advance;
522 return std::make_pair(&vchBuf[buffer_offset], advance);
523 }
524
525public:
/**
 * @param[in] file       Source file to read from; held by reference.
 * @param[in] nBufSize   Size of the internal buffer in bytes.
 * @param[in] nRewindIn  Number of bytes guaranteed to stay available for
 *                       rewinding; must be smaller than nBufSize.
 * @throws std::ios_base::failure if nRewindIn is not less than nBufSize.
 */
BufferedFile(AutoFile& file, uint64_t nBufSize, uint64_t nRewindIn)
    : m_src{file}, nReadLimit{std::numeric_limits<uint64_t>::max()}, nRewind{nRewindIn}, vchBuf(nBufSize, std::byte{0})
{
    const bool rewind_fits{nRewindIn < nBufSize};
    if (!rewind_fits) {
        throw std::ios_base::failure("Rewind limit must be less than buffer size");
    }
}
532
534 bool eof() const {
535 return m_read_pos == nSrcPos && m_src.feof();
536 }
537
540 {
541 while (dst.size() > 0) {
542 auto [buffer_pointer, length]{AdvanceStream(dst.size())};
543 memcpy(dst.data(), buffer_pointer, length);
544 dst = dst.subspan(length);
545 }
546 }
547
550 void SkipTo(const uint64_t file_pos)
551 {
552 assert(file_pos >= m_read_pos);
553 while (m_read_pos < file_pos) AdvanceStream(file_pos - m_read_pos);
554 }
555
557 uint64_t GetPos() const {
558 return m_read_pos;
559 }
560
562 bool SetPos(uint64_t nPos) {
563 size_t bufsize = vchBuf.size();
564 if (nPos + bufsize < nSrcPos) {
565 // rewinding too far, rewind as far as possible
566 m_read_pos = nSrcPos - bufsize;
567 return false;
568 }
569 if (nPos > nSrcPos) {
570 // can't go this far forward, go as far as possible
571 m_read_pos = nSrcPos;
572 return false;
573 }
574 m_read_pos = nPos;
575 return true;
576 }
577
580 bool SetLimit(uint64_t nPos = std::numeric_limits<uint64_t>::max()) {
581 if (nPos < m_read_pos)
582 return false;
583 nReadLimit = nPos;
584 return true;
585 }
586
587 template<typename T>
589 ::Unserialize(*this, obj);
590 return (*this);
591 }
592
594 void FindByte(std::byte byte)
595 {
596 // For best performance, avoid mod operation within the loop.
597 size_t buf_offset{size_t(m_read_pos % uint64_t(vchBuf.size()))};
598 while (true) {
599 if (m_read_pos == nSrcPos) {
600 // No more bytes available; read from the file into the buffer,
601 // setting nSrcPos to one beyond the end of the new data.
602 // Throws exception if end-of-file reached.
603 Fill();
604 }
605 const size_t len{std::min<size_t>(vchBuf.size() - buf_offset, nSrcPos - m_read_pos)};
606 const auto it_start{vchBuf.begin() + buf_offset};
607 const auto it_find{std::find(it_start, it_start + len, byte)};
608 const size_t inc{size_t(std::distance(it_start, it_find))};
609 m_read_pos += inc;
610 if (inc < len) break;
611 buf_offset += inc;
612 if (buf_offset >= vchBuf.size()) buf_offset = 0;
613 }
614 }
615};
616
617#endif // BITCOIN_STREAMS_H
int ret
ArgsManager & args
Definition: bitcoind.cpp:277
Non-refcounted RAII wrapper for FILE*.
Definition: streams.h:392
bool feof() const
Definition: streams.h:407
std::FILE * release()
Get wrapped FILE* with transfer of ownership.
Definition: streams.h:419
AutoFile & operator=(const AutoFile &)=delete
std::vector< std::byte > m_xor
Definition: streams.h:395
~AutoFile()
Definition: streams.h:401
std::FILE * m_file
Definition: streams.h:394
AutoFile & operator<<(const T &obj)
Definition: streams.h:456
AutoFile(const AutoFile &)=delete
bool IsNull() const
Return true if the wrapped FILE* is nullptr, false otherwise.
Definition: streams.h:428
AutoFile & operator>>(T &&obj)
Definition: streams.h:463
void SetXor(std::vector< std::byte > data_xor)
Continue with a different XOR key.
Definition: streams.h:431
std::size_t detail_fread(Span< std::byte > dst)
Implementation detail, only used internally.
Definition: streams.cpp:21
std::optional< int64_t > m_position
Definition: streams.h:396
int fclose()
Definition: streams.h:409
uint64_t Read(int nbits)
Read the specified number of bits from the stream.
Definition: streams.h:306
BitStreamReader(IStream &istream)
Definition: streams.h:301
IStream & m_istream
Definition: streams.h:289
void Write(uint64_t data, int nbits)
Write the nbits least significant bits of a 64-bit int to the output stream.
Definition: streams.h:354
OStream & m_ostream
Definition: streams.h:332
BitStreamWriter(OStream &ostream)
Definition: streams.h:344
void Flush()
Flush any unwritten bits to the output stream, padding with 0's to the next byte boundary.
Definition: streams.h:374
Wrapper around an AutoFile& that implements a ring buffer to deserialize from.
Definition: streams.h:477
std::vector< std::byte > vchBuf
the buffer
Definition: streams.h:484
std::pair< std::byte *, size_t > AdvanceStream(size_t length)
Advance the stream's read pointer (m_read_pos) by up to 'length' bytes, filling the buffer from the file first if no buffered bytes are available.
Definition: streams.h:508
uint64_t nRewind
how many bytes we guarantee to rewind
Definition: streams.h:483
bool eof() const
check whether we're at the end of the source file
Definition: streams.h:534
bool SetLimit(uint64_t nPos=std::numeric_limits< uint64_t >::max())
Prevent reading beyond a certain position; calling with no argument removes the limit.
Definition: streams.h:580
BufferedFile & operator>>(T &&obj)
Definition: streams.h:588
uint64_t GetPos() const
return the current reading position
Definition: streams.h:557
uint64_t nReadLimit
up to which position we're allowed to read
Definition: streams.h:482
void read(Span< std::byte > dst)
read a number of bytes
Definition: streams.h:539
void SkipTo(const uint64_t file_pos)
Move the read position ahead in the stream to the given position.
Definition: streams.h:550
void FindByte(std::byte byte)
search for a given byte in the stream, and remain positioned on it
Definition: streams.h:594
BufferedFile(AutoFile &file, uint64_t nBufSize, uint64_t nRewindIn)
Definition: streams.h:526
bool Fill()
read data from the source to fill the buffer
Definition: streams.h:487
AutoFile & m_src
Definition: streams.h:479
bool SetPos(uint64_t nPos)
rewind to a given reading position
Definition: streams.h:562
Double ended buffer combining vector and stream-like interfaces.
Definition: streams.h:147
void write(Span< const value_type > src)
Definition: streams.h:251
DataStream & operator<<(const T &obj)
Definition: streams.h:258
bool empty() const
Definition: streams.h:182
vector_type::difference_type difference_type
Definition: streams.h:156
size_type size() const
Definition: streams.h:181
DataStream & operator>>(T &&obj)
Definition: streams.h:265
reference operator[](size_type pos)
Definition: streams.h:186
void resize(size_type n, value_type c=value_type{})
Definition: streams.h:183
const_reference operator[](size_type pos) const
Definition: streams.h:185
void Xor(const std::vector< unsigned char > &key)
XOR the contents of this stream with a certain key.
Definition: streams.h:276
DataStream(Span< const value_type > sp)
Definition: streams.h:166
vector_type::size_type size_type
Definition: streams.h:155
SerializeData vector_type
Definition: streams.h:149
vector_type vch
Definition: streams.h:150
const value_type * data() const
Definition: streams.h:189
vector_type::const_reference const_reference
Definition: streams.h:158
value_type * data()
Definition: streams.h:188
vector_type::const_iterator const_iterator
Definition: streams.h:161
DataStream(Span< const uint8_t > sp)
Definition: streams.h:165
void reserve(size_type n)
Definition: streams.h:184
vector_type::reverse_iterator reverse_iterator
Definition: streams.h:162
iterator begin()
Definition: streams.h:178
const_iterator begin() const
Definition: streams.h:177
void read(Span< value_type > dst)
Definition: streams.h:218
vector_type::size_type m_read_pos
Definition: streams.h:151
vector_type::iterator iterator
Definition: streams.h:160
vector_type::value_type value_type
Definition: streams.h:159
bool eof() const
Definition: streams.h:215
std::string str() const
Definition: streams.h:168
void ignore(size_t num_ignore)
Definition: streams.h:236
vector_type::allocator_type allocator_type
Definition: streams.h:154
const_iterator end() const
Definition: streams.h:179
void Compact()
Definition: streams.h:191
void clear()
Definition: streams.h:187
size_t GetMemoryUsage() const noexcept
Compute total memory usage of this object (own memory + any dynamic memory).
Definition: streams.cpp:115
iterator end()
Definition: streams.h:180
bool Rewind(std::optional< size_type > n=std::nullopt)
Definition: streams.h:197
DataStream()=default
vector_type::reference reference
Definition: streams.h:157
int in_avail() const
Definition: streams.h:216
A Span is an object that can refer to a contiguous sequence of objects.
Definition: span.h:98
constexpr std::size_t size() const noexcept
Definition: span.h:187
CONSTEXPR_IF_NOT_DEBUG Span< C > subspan(std::size_t offset) const noexcept
Definition: span.h:195
constexpr C * data() const noexcept
Definition: span.h:174
constexpr C * begin() const noexcept
Definition: span.h:175
constexpr bool empty() const noexcept
Definition: span.h:189
constexpr C * end() const noexcept
Definition: span.h:176
Minimal stream for reading from an existing byte array by Span.
Definition: streams.h:101
bool empty() const
Definition: streams.h:119
SpanReader & operator>>(T &&obj)
Definition: streams.h:112
size_t size() const
Definition: streams.h:118
SpanReader(Span< const unsigned char > data)
Definition: streams.h:109
Span< const unsigned char > m_data
Definition: streams.h:103
void ignore(size_t n)
Definition: streams.h:135
void read(Span< std::byte > dst)
Definition: streams.h:121
std::vector< unsigned char > & vchData
Definition: streams.h:94
VectorWriter & operator<<(const T &obj)
Definition: streams.h:87
size_t nPos
Definition: streams.h:95
void write(Span< const std::byte > src)
Definition: streams.h:74
VectorWriter(std::vector< unsigned char > &vchDataIn, size_t nPosIn, Args &&... args)
Definition: streams.h:70
VectorWriter(std::vector< unsigned char > &vchDataIn, size_t nPosIn)
Definition: streams.h:60
void Xor(Span< std::byte > write, Span< const std::byte > key, size_t key_offset=0)
Definition: streams.h:28
std::optional< T > CheckedAdd(const T i, const T j) noexcept
Definition: overflow.h:26
void Serialize(Stream &, V)=delete
void SerializeMany(Stream &s, const Args &... args)
Support for (un)serializing many things at once.
Definition: serialize.h:994
void Unserialize(Stream &, V)=delete
Span< const std::byte > MakeByteSpan(V &&v) noexcept
Definition: span.h:269
Span< const std::byte > AsBytes(Span< T > s) noexcept
Definition: span.h:258
unsigned char * UCharCast(char *c)
Definition: span.h:280
Span< std::byte > MakeWritableByteSpan(V &&v) noexcept
Definition: span.h:274
assert(!tx.IsCoinBase())
std::vector< std::byte, zero_after_free_allocator< std::byte > > SerializeData
Byte-vector that clears its contents before deletion.
Definition: zeroafterfree.h:49