Files
imhex/lib/libimhex/source/helpers/encoding_file.cpp
iTrooz e5d9d9ec9e chore: apply more complicated lints (#2576)
<!--
Please provide as much information as possible about what your PR aims
to do.
PRs with no description will most likely be closed until more
information is provided.
If you're planing on changing fundamental behaviour or add big new
features, please open a GitHub Issue first before starting to work on
it.
If it's not something big and you still want to contact us about it,
feel free to do so !
-->

### Problem description
<!-- Describe the bug that you fixed/feature request that you
implemented, or link to an existing issue describing it -->

### Implementation description
<!-- Explain what you did to correct the problem -->

### Screenshots
<!-- If your change is visual, take a screenshot showing it. Ideally,
make before/after sceenshots -->

### Additional things
<!-- Anything else you would like to say -->
2025-12-21 20:55:50 +01:00

168 lines
5.0 KiB
C++

#include <hex/helpers/encoding_file.hpp>
#include <hex/helpers/utils.hpp>
#include <ranges>
#include <wolv/io/file.hpp>
#include <wolv/utils/string.hpp>
namespace hex {
EncodingFile::EncodingFile() : m_mapping(std::make_unique<std::map<size_t, std::map<std::vector<u8>, std::string>>>()) {
}
EncodingFile::EncodingFile(const hex::EncodingFile &other) {
m_mapping = std::make_unique<std::map<size_t, std::map<std::vector<u8>, std::string>>>(*other.m_mapping);
m_tableContent = other.m_tableContent;
m_longestSequence = other.m_longestSequence;
m_shortestSequence = other.m_shortestSequence;
m_valid = other.m_valid;
m_name = other.m_name;
}
EncodingFile::EncodingFile(EncodingFile &&other) noexcept {
m_mapping = std::move(other.m_mapping);
m_tableContent = std::move(other.m_tableContent);
m_longestSequence = other.m_longestSequence;
m_shortestSequence = other.m_shortestSequence;
m_valid = other.m_valid;
m_name = std::move(other.m_name);
}
EncodingFile::EncodingFile(Type type, const std::fs::path &path) : EncodingFile() {
auto file = wolv::io::File(path, wolv::io::File::Mode::Read);
switch (type) {
case Type::Thingy:
parse(file.readString());
break;
default:
return;
}
{
m_name = path.stem().string();
m_name = wolv::util::replaceStrings(m_name, "_", " ");
if (!m_name.empty())
m_name[0] = std::toupper(m_name[0]);
}
m_valid = true;
}
EncodingFile::EncodingFile(Type type, const std::string &content) : EncodingFile() {
switch (type) {
case Type::Thingy:
parse(content);
break;
default:
return;
}
m_name = "Unknown";
m_valid = true;
}
EncodingFile &EncodingFile::operator=(const hex::EncodingFile &other) {
if(this == &other) {
return *this;
}
m_mapping = std::make_unique<std::map<size_t, std::map<std::vector<u8>, std::string>>>(*other.m_mapping);
m_tableContent = other.m_tableContent;
m_longestSequence = other.m_longestSequence;
m_shortestSequence = other.m_shortestSequence;
m_valid = other.m_valid;
m_name = other.m_name;
return *this;
}
EncodingFile &EncodingFile::operator=(EncodingFile &&other) noexcept {
m_mapping = std::move(other.m_mapping);
m_tableContent = std::move(other.m_tableContent);
m_longestSequence = other.m_longestSequence;
m_shortestSequence = other.m_shortestSequence;
m_valid = other.m_valid;
m_name = std::move(other.m_name);
return *this;
}
std::pair<std::string_view, size_t> EncodingFile::getEncodingFor(std::span<const u8> buffer) const {
for (const auto &[size, mapping] : std::ranges::reverse_view(*m_mapping)) {
if (size > buffer.size()) continue;
std::vector key(buffer.begin(), buffer.begin() + size);
if (mapping.contains(key))
return { mapping.at(key), size };
}
return { ".", 1 };
}
u64 EncodingFile::getEncodingLengthFor(std::span<u8> buffer) const {
for (const auto& [size, mapping] : std::ranges::reverse_view(*m_mapping)) {
if (size > buffer.size()) continue;
std::vector key(buffer.begin(), buffer.begin() + size);
if (mapping.contains(key))
return size;
}
return 1;
}
std::string EncodingFile::decodeAll(std::span<const u8> buffer) const {
std::string result;
while (!buffer.empty()) {
const auto [character, size] = getEncodingFor(buffer);
result += character;
buffer = buffer.subspan(size);
}
return result;
}
void EncodingFile::parse(const std::string &content) {
m_tableContent = content;
for (const auto &line : wolv::util::splitString(m_tableContent, "\n")) {
std::string from, to;
{
auto delimiterPos = line.find('=');
if (delimiterPos >= line.length())
continue;
from = line.substr(0, delimiterPos);
to = line.substr(delimiterPos + 1);
if (from.empty()) continue;
}
auto fromBytes = hex::parseByteString(from);
if (fromBytes.empty()) continue;
if (to.length() > 1)
to = wolv::util::trim(to);
if (to.empty())
to = " ";
if (!m_mapping->contains(fromBytes.size()))
m_mapping->insert({ fromBytes.size(), {} });
u64 keySize = fromBytes.size();
(*m_mapping)[keySize].insert({ std::move(fromBytes), to });
m_longestSequence = std::max(m_longestSequence, keySize);
m_shortestSequence = std::min(m_shortestSequence, keySize);
}
}
}