This library for C++20 and newer assists reading from and writing to binary data, making use of my own experience as a reverse engineer.
It aims to:
- Make use of modern C++ features where useful (i.e.
std::endian
and co.). - Be as open-purposed as possible for a wide range of use cases.
- Mirror the standard library's style for interface.
- Receive updates as necessary.
Here is the full list of includes used by this library:
#include <bit>
#include <cstring>
#include <fstream>
#include <cstdint>
#include <string_view>
#include <type_traits>
#include <vector>
Otherwise, no external dependencies are used.
With a single header file at only ~10KB, it's very easy to start using this library. Support for build systems like CMake may be added in the future.
#include <kojo/binary.hpp> // or something along those lines.
A binary
class is provided, under the kojo
namespace, and can be initialised via a file path as an std::string
, the address of the start of some data, or another binary
object.
Alternatively, you can default initialise, and instead use .load()
later on. Note that this will clear any data you may have had loaded into the object previously.
#include <kojo/binary.hpp>
int main() {
std::vector<char> some_data = {'S', 'o', 'm', 'e', ' ', 'd', 'a', 't', 'a', '.'};
// Initialising
kojo::binary from_file{"./example/file/path.bin"};
kojo::binary from_address{some_data.data()};
kojo::binary from_object{from_file};
// Using `load()`
kojo::binary from_file;
from_file.load("./example/file/path.bin");
kojo::binary from_address;
from_address.load(some_data.data());
kojo::binary load_from_object;
from_object.load(&from_file);
}
Here is a list of every publicly-accessible element for the binary
class, with examples:
The constructor. Either initialises a binary
object that is empty, or with either a file (via filepath) or binary data.
binary();
binary(std::string path_input, size_t start = 0, size_t size = -1);
binary(void* pointer, size_t start = 0, size_t size = -1);
binary(binary& binary_data, size_t start = 0, size_t size = -1);
// Initialise as empty:
kojo::binary ex_empty;
// Initialise from filepath:
kojo::binary ex_filepath{"./example/file/path.bin"};
std::filesystem::path path = "another/example/file/path.bin";
kojo::binary ex_fspath{path.string()};
// Initialise from address:
std::vector<char> vec = {'S', 'o', 'm', 'e', ' ', 'd', 'a', 't', 'a', '.'};
kojo::binary ex_vector{vec.data(), 0, vec.size()};
kojo::binary ex_vectorsect{vec.data(), 5, 4}; // Only contains "data"
// Initialise from another binary object:
kojo::binary ex_object{ex_vector}; // Contains "Some data."
Same as the constructors, but can be used after initialisation, clearing all existing data.
void load(std::string path_input, size_t start = 0, size_t size = -1);
void load(void* pointer, size_t start = 0, size_t size = -1);
void load(binary& binary_data, size_t start = 0, size_t size = -1);
kojo::binary foo;
// Load from filepath:
foo.load("./example/file/path.bin");
std::filesystem::path path = "another/example/file/path.bin";
foo.load(path.string());
// Load from address:
std::vector<char> vec = {'S', 'o', 'm', 'e', ' ', 'd', 'a', 't', 'a', '.'};
foo.load(vec.data(), 0, vec.size());
foo.load(vec.data(), 5, 4); // Only contains "data"
// Load from another binary object:
kojo::binary boo{vec.data(), 0, vec.size()};
foo.load(boo); // Contains "Some data."
Clears all stored data and resets the position back to 0.
void clear();
kojo::binary writer;
writer.write<std::string>("Gone... Reduced to atoms.");
writer.clear();
writer.write<std::string>("Out with the old...");
kojo::binary reader{writer};
std::cout << reader.read<std::string>(); // "Out with the old..."
Returns a pointer to the data accessed by the object, whether that be internally or externally stored.
unsigned char* data();
kojo::binary foo;
foo.write<char>('B');
foo.write<std::string>("azinga!");
std::cout << foo.data(); // "Bazinga!"
Returns the size of the internally-stored data if existing, or -1
otherwise.
size_t size();
kojo::binary foo;
foo.write<std::uint64_t>(23, std::endian::big);
foo.write<std::uint32_t>(420, std::endian::big);
std::cout << foo.size(); // 12
Sets the endianness of an integer to big or little. Mostly exists for internal use.
template <typename T> T set_endian(T value, std::endian endianness);
static_assert(std::is_integral<T>::value, "T must be an integral type.");
kojo::binary foo;
std::uint32_t number = foo.set_endian(1, std::endian::big); // 00 00 00 01
number = foo.set_endian(number, std::endian::little); // 01 00 00 00
Reads from data into a specified type, that being an integer, char
, or std::string
.
template <typename T> T read(std::endian endianness, size_t offset = 0);
static_assert(std::is_integral<T>::value, "T must be an integral type.");
template <typename T> typename std::enable_if<std::is_same<T, char>::value, char>::type read(size_t offset = 0);
template <typename T> typename std::enable_if<std::is_same<T, std::string>::value, std::string>::type read(size_t size = 0, size_t offset = 0);
std::vector<char> vec{17, 1, 0, 0, 'h', 'P', 'N', 'G', 'J', 'o', 'h', 'n', '\0', 'B'};
kojo::binary foo{vec.data(), 0, vec.size()};
std::cout << foo.read<std::uint32_t>(std::endian::little); // 273
std::cout << foo.read<char>(); // 'h'
std::cout << foo.read<std::string>(3); // "PNG"
std::cout << foo.read<std::string>(); // "John"
Writes specified data at the end of the internally-stored data. Cannot overwrite.
template <typename T> void write(T value, endian endianness);
static_assert(std::is_integral<T>::value, "T must be an integral type.");
template <typename T> void write(typename std::enable_if<std::is_same<T, char>::value, char>::type value);
template <typename T> void write(typename std::enable_if<std::is_same<T, std::string>::value, std::string>::type value, size_t length = 0);
template <typename T> void write(typename std::enable_if<std::is_same<T, std::vector<unsigned char>>::value, std::vector<unsigned char>>::type& value);
kojo::binary foo;
foo.write<std::int64_t>(-281029, std::endian::big);
foo.write<std::uint16_t>(934, std::endian::little);
foo.write<char>('E');
foo.write<std::string>("Die Speisekarte, bitte."); // Null-terminated.
foo.write<std::string>("NUCC", 4); // Not null-terminated.
std::vector<unsigned char> vec{'a', 'B', 'c', 'D'};
foo.write<std::vector<unsigned char>>(vec);
Returns the current position in the data.
size_t get_pos();
kojo::binary foo;
std::cout << foo.get_pos(); // 0
foo.write<std::uint32_t>(5, std::endian::big);
std::cout << foo.get_pos(); // 4
foo.write<std::string>("YouGotCAGEd");
std::cout << foo.get_pos(); // 16
Sets the current position in the data.
void set_pos(size_t pos);
kojo::binary foo;
foo.write<std::string>("Goodbye JoJo!");
foo.set_pos(0);
std::cout << foo.read<std::string>(); // "Goodbye JoJo!"
Changes the position in data by an offset, positive or negative.
void change_pos(std::int64_t offset);
kojo::binary foo;
foo.write<std::string>("Goodbye JoJo!");
foo.set_pos(0);
foo.change_pos(8);
std::cout << foo.read<std::string>(); // "JoJo!"
Changes the position in data to the next multiple of a specified integer.
void align_by(size_t bytes);
kojo::binary foo;
foo.write<std::string>("ABCDEFGHGood grief.");
foo.set_pos(0);
foo.change_pos(5);
foo.align_by(4);
std::cout << foo.read<std::string>(); // "Good grief."
Outputs the data to a file at a specified path.
void dump_file(std::string output_path);
kojo::binary foo;
foo.write<std::string>("Coca Cola espuma");
foo.dump_file("./some_path.bin");