mirror of
https://github.com/WerWolv/ImHex.git
synced 2026-03-28 15:57:03 -05:00
<!-- Please provide as much information as possible about what your PR aims to do. PRs with no description will most likely be closed until more information is provided. If you're planing on changing fundamental behaviour or add big new features, please open a GitHub Issue first before starting to work on it. If it's not something big and you still want to contact us about it, feel free to do so ! --> ### Problem description <!-- Describe the bug that you fixed/feature request that you implemented, or link to an existing issue describing it --> ### Implementation description <!-- Explain what you did to correct the problem --> ### Screenshots <!-- If your change is visual, take a screenshot showing it. Ideally, make before/after sceenshots --> ### Additional things <!-- Anything else you would like to say -->
168 lines
5.0 KiB
C++
168 lines
5.0 KiB
C++
#include <hex/helpers/encoding_file.hpp>
|
|
|
|
#include <hex/helpers/utils.hpp>
|
|
|
|
#include <ranges>
|
|
#include <wolv/io/file.hpp>
|
|
#include <wolv/utils/string.hpp>
|
|
|
|
namespace hex {
|
|
|
|
EncodingFile::EncodingFile() : m_mapping(std::make_unique<std::map<size_t, std::map<std::vector<u8>, std::string>>>()) {
|
|
|
|
}
|
|
|
|
EncodingFile::EncodingFile(const hex::EncodingFile &other) {
|
|
m_mapping = std::make_unique<std::map<size_t, std::map<std::vector<u8>, std::string>>>(*other.m_mapping);
|
|
m_tableContent = other.m_tableContent;
|
|
m_longestSequence = other.m_longestSequence;
|
|
m_shortestSequence = other.m_shortestSequence;
|
|
m_valid = other.m_valid;
|
|
m_name = other.m_name;
|
|
}
|
|
|
|
EncodingFile::EncodingFile(EncodingFile &&other) noexcept {
|
|
m_mapping = std::move(other.m_mapping);
|
|
m_tableContent = std::move(other.m_tableContent);
|
|
m_longestSequence = other.m_longestSequence;
|
|
m_shortestSequence = other.m_shortestSequence;
|
|
m_valid = other.m_valid;
|
|
m_name = std::move(other.m_name);
|
|
}
|
|
|
|
EncodingFile::EncodingFile(Type type, const std::fs::path &path) : EncodingFile() {
|
|
auto file = wolv::io::File(path, wolv::io::File::Mode::Read);
|
|
switch (type) {
|
|
case Type::Thingy:
|
|
parse(file.readString());
|
|
break;
|
|
default:
|
|
return;
|
|
}
|
|
|
|
{
|
|
m_name = path.stem().string();
|
|
m_name = wolv::util::replaceStrings(m_name, "_", " ");
|
|
|
|
if (!m_name.empty())
|
|
m_name[0] = std::toupper(m_name[0]);
|
|
}
|
|
|
|
m_valid = true;
|
|
}
|
|
|
|
EncodingFile::EncodingFile(Type type, const std::string &content) : EncodingFile() {
|
|
switch (type) {
|
|
case Type::Thingy:
|
|
parse(content);
|
|
break;
|
|
default:
|
|
return;
|
|
}
|
|
|
|
m_name = "Unknown";
|
|
m_valid = true;
|
|
}
|
|
|
|
|
|
EncodingFile &EncodingFile::operator=(const hex::EncodingFile &other) {
|
|
if(this == &other) {
|
|
return *this;
|
|
}
|
|
m_mapping = std::make_unique<std::map<size_t, std::map<std::vector<u8>, std::string>>>(*other.m_mapping);
|
|
m_tableContent = other.m_tableContent;
|
|
m_longestSequence = other.m_longestSequence;
|
|
m_shortestSequence = other.m_shortestSequence;
|
|
m_valid = other.m_valid;
|
|
m_name = other.m_name;
|
|
|
|
return *this;
|
|
}
|
|
|
|
EncodingFile &EncodingFile::operator=(EncodingFile &&other) noexcept {
|
|
m_mapping = std::move(other.m_mapping);
|
|
m_tableContent = std::move(other.m_tableContent);
|
|
m_longestSequence = other.m_longestSequence;
|
|
m_shortestSequence = other.m_shortestSequence;
|
|
m_valid = other.m_valid;
|
|
m_name = std::move(other.m_name);
|
|
|
|
return *this;
|
|
}
|
|
|
|
|
|
|
|
std::pair<std::string_view, size_t> EncodingFile::getEncodingFor(std::span<const u8> buffer) const {
|
|
for (const auto &[size, mapping] : std::ranges::reverse_view(*m_mapping)) {
|
|
if (size > buffer.size()) continue;
|
|
|
|
std::vector key(buffer.begin(), buffer.begin() + size);
|
|
if (mapping.contains(key))
|
|
return { mapping.at(key), size };
|
|
}
|
|
|
|
return { ".", 1 };
|
|
}
|
|
|
|
u64 EncodingFile::getEncodingLengthFor(std::span<u8> buffer) const {
|
|
for (const auto& [size, mapping] : std::ranges::reverse_view(*m_mapping)) {
|
|
if (size > buffer.size()) continue;
|
|
|
|
std::vector key(buffer.begin(), buffer.begin() + size);
|
|
if (mapping.contains(key))
|
|
return size;
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
std::string EncodingFile::decodeAll(std::span<const u8> buffer) const {
|
|
std::string result;
|
|
|
|
while (!buffer.empty()) {
|
|
const auto [character, size] = getEncodingFor(buffer);
|
|
result += character;
|
|
buffer = buffer.subspan(size);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
|
|
void EncodingFile::parse(const std::string &content) {
|
|
m_tableContent = content;
|
|
for (const auto &line : wolv::util::splitString(m_tableContent, "\n")) {
|
|
|
|
std::string from, to;
|
|
{
|
|
auto delimiterPos = line.find('=');
|
|
|
|
if (delimiterPos >= line.length())
|
|
continue;
|
|
|
|
from = line.substr(0, delimiterPos);
|
|
to = line.substr(delimiterPos + 1);
|
|
|
|
if (from.empty()) continue;
|
|
}
|
|
|
|
auto fromBytes = hex::parseByteString(from);
|
|
if (fromBytes.empty()) continue;
|
|
|
|
if (to.length() > 1)
|
|
to = wolv::util::trim(to);
|
|
if (to.empty())
|
|
to = " ";
|
|
|
|
if (!m_mapping->contains(fromBytes.size()))
|
|
m_mapping->insert({ fromBytes.size(), {} });
|
|
|
|
u64 keySize = fromBytes.size();
|
|
(*m_mapping)[keySize].insert({ std::move(fromBytes), to });
|
|
|
|
m_longestSequence = std::max(m_longestSequence, keySize);
|
|
m_shortestSequence = std::min(m_shortestSequence, keySize);
|
|
}
|
|
}
|
|
|
|
} |