364 lines
8.9 KiB
C++
364 lines
8.9 KiB
C++
// This file Copyright © 2008-2023 Mnemosyne LLC.
|
|
// It may be used under GPLv2 (SPDX: GPL-2.0-only), GPLv3 (SPDX: GPL-3.0-only),
|
|
// or any future license endorsed by Mnemosyne LLC.
|
|
// License text can be found in the licenses/ folder.
|
|
|
|
#include <algorithm>
|
|
#include <array>
|
|
#include <cctype> /* isdigit() */
|
|
#include <cstddef> // size_t, std::byte
|
|
#include <cstdint> // int64_t
|
|
#include <deque>
|
|
#include <string>
|
|
#include <string_view>
|
|
#include <optional>
|
|
|
|
#include <fmt/core.h>
|
|
#include <fmt/compile.h>
|
|
|
|
#define LIBTRANSMISSION_VARIANT_MODULE
|
|
|
|
#include "libtransmission/benc.h"
|
|
#include "libtransmission/quark.h"
|
|
#include "libtransmission/tr-buffer.h"
|
|
#include "libtransmission/utils.h"
|
|
#include "libtransmission/variant.h"
|
|
|
|
struct tr_error;
|
|
|
|
using namespace std::literals;
|
|
|
|
// Exclusive upper bound (128 MiB) on the length prefix of a bencoded string:
// ParseString() rejects any declared length that is >= this value.
auto constexpr MaxBencStrLength = size_t{ 128 * 1024 * 1024 }; // arbitrary
|
|
|
|
// ---
|
|
|
|
namespace transmission::benc::impl
|
|
{
|
|
|
|
/**
|
|
* The initial i and trailing e are beginning and ending delimiters.
|
|
* You can have negative numbers such as i-3e. You cannot prefix the
|
|
* number with a zero such as i04e. However, i0e is valid.
|
|
* Example: i3e represents the integer "3"
|
|
*
|
|
* The maximum number of bit of this integer is unspecified,
|
|
* but to handle it as a signed 64bit integer is mandatory to handle
|
|
* "large files" aka .torrent for more that 4Gbyte
|
|
*/
|
|
std::optional<int64_t> ParseInt(std::string_view* benc)
|
|
{
|
|
auto constexpr Prefix = "i"sv;
|
|
auto constexpr Suffix = "e"sv;
|
|
|
|
// find the beginning delimiter
|
|
auto walk = *benc;
|
|
if (std::size(walk) < 3 || !tr_strv_starts_with(walk, Prefix))
|
|
{
|
|
return {};
|
|
}
|
|
|
|
// find the ending delimiter
|
|
walk.remove_prefix(std::size(Prefix));
|
|
if (auto const pos = walk.find(Suffix); pos == std::string_view::npos)
|
|
{
|
|
return {};
|
|
}
|
|
|
|
// leading zeroes are not allowed
|
|
if ((walk[0] == '0' && (isdigit(static_cast<unsigned char>(walk[1])) != 0)) ||
|
|
(walk[0] == '-' && walk[1] == '0' && (isdigit(static_cast<unsigned char>(walk[2])) != 0)))
|
|
{
|
|
return {};
|
|
}
|
|
|
|
// parse the string and make sure the next char is `Suffix`
|
|
auto const value = tr_num_parse<int64_t>(walk, &walk);
|
|
if (!value || !tr_strv_starts_with(walk, Suffix))
|
|
{
|
|
return {};
|
|
}
|
|
|
|
walk.remove_prefix(std::size(Suffix));
|
|
*benc = walk;
|
|
return *value;
|
|
}
|
|
|
|
/**
|
|
* Byte strings are encoded as follows:
|
|
* <string length encoded in base ten ASCII>:<string data>
|
|
* Note that there is no constant beginning delimiter, and no ending delimiter.
|
|
* Example: 4:spam represents the string "spam"
|
|
*/
|
|
std::optional<std::string_view> ParseString(std::string_view* benc)
|
|
{
|
|
// find the ':' delimiter
|
|
auto const colon_pos = benc->find(':');
|
|
if (colon_pos == std::string_view::npos)
|
|
{
|
|
return {};
|
|
}
|
|
|
|
// get the string length
|
|
auto svtmp = benc->substr(0, colon_pos);
|
|
if (!std::all_of(std::begin(svtmp), std::end(svtmp), [](auto ch) { return isdigit(static_cast<unsigned char>(ch)) != 0; }))
|
|
{
|
|
return {};
|
|
}
|
|
|
|
auto const len = tr_num_parse<size_t>(svtmp, &svtmp);
|
|
if (!len || *len >= MaxBencStrLength)
|
|
{
|
|
return {};
|
|
}
|
|
|
|
// do we have `len` bytes of string data?
|
|
svtmp = benc->substr(colon_pos + 1);
|
|
if (std::size(svtmp) < len)
|
|
{
|
|
return {};
|
|
}
|
|
|
|
auto const string = svtmp.substr(0, *len);
|
|
*benc = svtmp.substr(*len);
|
|
return string;
|
|
}
|
|
|
|
} // namespace transmission::benc::impl
|
|
|
|
// ---
|
|
|
|
namespace
|
|
{
|
|
namespace parse_helpers
|
|
{
|
|
struct MyHandler : public transmission::benc::Handler
|
|
{
|
|
tr_variant* const top_;
|
|
bool inplace_;
|
|
std::deque<tr_variant*> stack_;
|
|
std::optional<tr_quark> key_;
|
|
|
|
MyHandler(tr_variant* top, bool inplace)
|
|
: top_{ top }
|
|
, inplace_{ inplace }
|
|
{
|
|
}
|
|
|
|
MyHandler(MyHandler&&) = delete;
|
|
MyHandler(MyHandler const&) = delete;
|
|
MyHandler& operator=(MyHandler&&) = delete;
|
|
MyHandler& operator=(MyHandler const&) = delete;
|
|
|
|
~MyHandler() override = default;
|
|
|
|
bool Int64(int64_t value, Context const& /*context*/) final
|
|
{
|
|
auto* const variant = get_node();
|
|
if (variant == nullptr)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
tr_variantInitInt(variant, value);
|
|
return true;
|
|
}
|
|
|
|
bool String(std::string_view sv, Context const& /*context*/) final
|
|
{
|
|
auto* const variant = get_node();
|
|
if (variant == nullptr)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
if (inplace_)
|
|
{
|
|
tr_variantInitStrView(variant, sv);
|
|
}
|
|
else
|
|
{
|
|
tr_variantInitStr(variant, sv);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
bool StartDict(Context const& /*context*/) final
|
|
{
|
|
auto* const variant = get_node();
|
|
if (variant == nullptr)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
tr_variantInitDict(variant, 0);
|
|
stack_.push_back(variant);
|
|
return true;
|
|
}
|
|
|
|
bool Key(std::string_view sv, Context const& /*context*/) final
|
|
{
|
|
key_ = tr_quark_new(sv);
|
|
|
|
return true;
|
|
}
|
|
|
|
bool EndDict(Context const& /*context*/) final
|
|
{
|
|
if (std::empty(stack_))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
stack_.pop_back();
|
|
return true;
|
|
}
|
|
|
|
bool StartArray(Context const& /*context*/) final
|
|
{
|
|
auto* const variant = get_node();
|
|
if (variant == nullptr)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
tr_variantInitList(variant, 0);
|
|
stack_.push_back(variant);
|
|
return true;
|
|
}
|
|
|
|
bool EndArray(Context const& /*context*/) final
|
|
{
|
|
if (std::empty(stack_))
|
|
{
|
|
return false;
|
|
}
|
|
|
|
stack_.pop_back();
|
|
return true;
|
|
}
|
|
|
|
private:
|
|
tr_variant* get_node()
|
|
{
|
|
tr_variant* node = nullptr;
|
|
|
|
if (std::empty(stack_))
|
|
{
|
|
node = top_;
|
|
}
|
|
else if (auto* parent = stack_.back(); tr_variantIsList(parent))
|
|
{
|
|
node = tr_variantListAdd(parent);
|
|
}
|
|
else if (key_ && tr_variantIsDict(parent))
|
|
{
|
|
node = tr_variantDictAdd(parent, *key_);
|
|
key_.reset();
|
|
}
|
|
|
|
return node;
|
|
}
|
|
};
|
|
} // namespace parse_helpers
|
|
} // namespace
|
|
|
|
std::optional<tr_variant> tr_variant_serde::parse_benc(std::string_view input)
|
|
{
|
|
using namespace parse_helpers;
|
|
using Stack = transmission::benc::ParserStack<512>;
|
|
|
|
auto top = tr_variant{};
|
|
auto stack = Stack{};
|
|
auto handler = MyHandler{ &top, parse_inplace_ };
|
|
if (transmission::benc::parse(input, stack, handler, &end_, &error_) && std::empty(stack))
|
|
{
|
|
return std::optional<tr_variant>{ std::move(top) };
|
|
}
|
|
|
|
return {};
|
|
}
|
|
|
|
// ---
|
|
|
|
namespace
|
|
{
|
|
namespace to_string_helpers
|
|
{
|
|
// Buffer type that every save*Func callback below receives through its
// type-erased `void*` argument and appends its bencoded output to.
using OutBuf = libtransmission::StackBuffer<1024U * 8U, std::byte>;
|
|
|
|
// Appends `val` to the output buffer as a bencoded integer: `i<val>e`.
// `vout` must point to an OutBuf.
void saveIntFunc(tr_variant const& /*var*/, int64_t const val, void* vout)
{
    auto* const sink = static_cast<OutBuf*>(vout);

    // format directly into space reserved at the end of the buffer,
    // then commit only the bytes that were actually written
    auto const [space, space_len] = sink->reserve_space(64U);
    auto* const first = reinterpret_cast<char*>(space);
    auto* const last = fmt::format_to(first, FMT_COMPILE("i{:d}e"), val);
    sink->commit_space(last - first);
}
|
|
|
|
// Appends a boolean to the output buffer as a bencoded integer:
// `i1e` for true, `i0e` for false. `vout` must point to an OutBuf.
void saveBoolFunc(tr_variant const& /*var*/, bool const val, void* vout)
{
    auto* const sink = static_cast<OutBuf*>(vout);

    if (val)
    {
        sink->add("i1e"sv);
    }
    else
    {
        sink->add("i0e"sv);
    }
}
|
|
|
|
// Appends `sv` to `out` as a bencoded byte string: `<length>:<bytes>`.
void saveStringImpl(OutBuf* out, std::string_view sv)
{
    auto const n_bytes = std::size(sv);

    // reserve room for the payload plus the decimal length prefix and ':'
    auto const [space, space_len] = out->reserve_space(n_bytes + 32U);
    auto* const first = reinterpret_cast<char*>(space);
    auto* const last = fmt::format_to(first, FMT_COMPILE("{:d}:{:s}"), n_bytes, sv);

    // commit only what was actually written
    out->commit_space(last - first);
}
|
|
|
|
// Walk callback for string values: forwards to saveStringImpl() after
// recovering the OutBuf from the type-erased `vout` pointer.
void saveStringFunc(tr_variant const& /*var*/, std::string_view const val, void* vout)
{
    auto* const sink = static_cast<OutBuf*>(vout);
    saveStringImpl(sink, val);
}
|
|
|
|
// Walk callback for real (floating-point) values.
//
// The benc spec has no float type, so the value is rendered as fixed-point
// text with "{:f}" and emitted as a bencoded string via saveStringImpl().
// `vout` must point to an OutBuf.
void saveRealFunc(tr_variant const& /*val*/, double const val, void* vout)
{
    // the benc spec doesn't handle floats; save it as a string.

    // "{:f}" never switches to exponent notation, so the largest finite
    // doubles expand to: sign + 309 integer digits + '.' + 6 fraction
    // digits = 317 characters. The buffer must be able to hold all of that.
    auto buf = std::array<char, 320>{};

    // format_to_n() stops writing at the end of `buf`, so the stack array
    // cannot be overrun even if the rendering were longer than expected.
    auto const result = fmt::format_to_n(std::data(buf), std::size(buf), FMT_COMPILE("{:f}"), val);
    auto const len = static_cast<size_t>(result.out - std::data(buf));

    saveStringImpl(static_cast<OutBuf*>(vout), { std::data(buf), len });
}
|
|
|
|
// Walk callback for the start of a dict: appends the `d` marker.
// `vbuf` must point to an OutBuf.
void saveDictBeginFunc(tr_variant const& /*val*/, void* vbuf)
{
    auto* const sink = static_cast<OutBuf*>(vbuf);
    sink->push_back('d');
}
|
|
|
|
// Walk callback for the start of a list: appends the `l` marker.
// `vbuf` must point to an OutBuf.
void saveListBeginFunc(tr_variant const& /*val*/, void* vbuf)
{
    auto* const sink = static_cast<OutBuf*>(vbuf);
    sink->push_back('l');
}
|
|
|
|
// Walk callback for the end of a container: appends the `e` marker.
// `vbuf` must point to an OutBuf.
void saveContainerEndFunc(tr_variant const& /*val*/, void* vbuf)
{
    auto* const sink = static_cast<OutBuf*>(vbuf);
    sink->push_back('e');
}
|
|
|
|
} // namespace to_string_helpers
|
|
} // namespace
|
|
|
|
std::string tr_variant_serde::to_benc_string(tr_variant const& var)
|
|
{
|
|
using namespace to_string_helpers;
|
|
|
|
static auto constexpr Funcs = WalkFuncs{
|
|
saveIntFunc, //
|
|
saveBoolFunc, //
|
|
saveRealFunc, //
|
|
saveStringFunc, //
|
|
saveDictBeginFunc, //
|
|
saveListBeginFunc, //
|
|
saveContainerEndFunc, //
|
|
};
|
|
|
|
auto buf = OutBuf{};
|
|
walk(var, Funcs, &buf, true);
|
|
return buf.to_string();
|
|
}
|