#include "runtime/helpers/spy_input.h"
#include <string.h>
#include <algorithm>
#include "utf8proc.h"
#include <assert.h>

using std::string;

// Upper bound on the number of bytes used to encode one UTF-8 character.
static const size_t UTF8_MAX_CHAR_SIZE = 4;

// Returns the number of bytes occupied by the character at the start of `str`
// (which has `len` readable bytes). utf8proc_iterate reports malformed input
// with a non-positive value; in that case the offending byte is counted as a
// single one-byte character so that callers always make forward progress.
static size_t utf8_char_size(const char *str, size_t len) {
  int32_t code_point;
  auto size = utf8proc_iterate(
    reinterpret_cast<const uint8_t *>(str), len, &code_point);
  return size > 0 ? static_cast<size_t>(size) : 1;
}

// Counts the UTF-8 characters contained in `text`.
size_t SpyInput::char_count(const string &text) {
  const char *bytes = text.data();
  size_t len = text.size();
  size_t character = 0, byte = 0;
  while (byte < len) {
    byte += utf8_char_size(bytes + byte, len - byte);
    character++;
  }
  return character;
}

// Returns the byte offset within `str` (of `len` bytes) at which the
// character with index `goal_character` begins, or -1 if `str` ends before
// that many characters have been consumed.
static long byte_for_character(const char *str, size_t len, size_t goal_character) {
  size_t character = 0, byte = 0;
  while (character < goal_character) {
    if (byte >= len)
      return -1;
    byte += utf8_char_size(str + byte, len - byte);
    character++;
  }
  return byte;
}

// Creates an input over `content` that is handed out in chunks of at most
// `chars_per_chunk` characters. The chunk buffer is sized for the worst case
// of every character taking UTF8_MAX_CHAR_SIZE bytes.
SpyInput::SpyInput(string content, size_t chars_per_chunk) :
  chars_per_chunk(chars_per_chunk),
  buffer_size(UTF8_MAX_CHAR_SIZE * chars_per_chunk),
  buffer(new char[buffer_size]),
  byte_offset(0),
  content(content),
  strings_read({""}) {}

SpyInput::~SpyInput() {
  // `buffer` was allocated with `new char[]`, so it must be released with the
  // array form of delete.
  delete[] buffer;
}

// Read callback: `payload` is the SpyInput. Copies the next chunk (at most
// `chars_per_chunk` characters, starting at the current byte offset) into the
// internal buffer, stores its size in `*bytes_read`, advances the offset, and
// appends the chunk to the most recent entry of `strings_read`.
const char * SpyInput::read(void *payload, size_t *bytes_read) {
  auto spy = static_cast<SpyInput *>(payload);

  // An offset past the end of the content yields an empty chunk.
  if (spy->byte_offset > spy->content.size()) {
    *bytes_read = 0;
    return "";
  }

  const char *start = spy->content.data() + spy->byte_offset;
  size_t bytes_remaining = spy->content.size() - spy->byte_offset;

  // A negative result means fewer than `chars_per_chunk` characters remain,
  // so the chunk is simply the rest of the content.
  long byte_count = byte_for_character(start, bytes_remaining, spy->chars_per_chunk);
  if (byte_count < 0)
    byte_count = bytes_remaining;

  *bytes_read = byte_count;
  spy->byte_offset += byte_count;
  spy->strings_read.back() += string(start, byte_count);

  /*
   * This class stores its entire `content` in a contiguous buffer, but we want
   * to ensure that the code under test cannot accidentally read more than
   * `*bytes_read` bytes past the returned pointer. To make sure that this type
   * of error does not go unnoticed, we copy the chunk into a zeroed-out buffer
   * and return a pointer to that buffer, rather than a pointer into the main
   * content.
   */
  memset(spy->buffer, 0, spy->buffer_size);
  memcpy(spy->buffer, start, byte_count);
  return spy->buffer;
}

// Seek callback: `payload` is the SpyInput. Moves the read position to `byte`
// (the `character` argument is not used) and starts a new entry in
// `strings_read` unless the current last entry is still empty. Always
// returns 0.
int SpyInput::seek(void *payload, size_t character, size_t byte) {
  auto spy = static_cast<SpyInput *>(payload);
  if (spy->strings_read.size() == 0 || spy->strings_read.back().size() > 0)
    spy->strings_read.push_back("");
  spy->byte_offset = byte;
  return 0;
}

// Builds a TSInput whose payload is this object and whose callbacks are the
// static `seek` and `read` functions above.
TSInput SpyInput::input() {
  TSInput result;
  result.payload = this;
  result.seek_fn = seek;
  result.read_fn = read;
  return result;
}

// Replaces `chars_removed` characters starting at character `start_char` with
// `text`, records the inverse edit on the undo stack, and returns a
// description of the edit that was performed.
TSInputEdit SpyInput::replace(size_t start_char, size_t chars_removed, string text) {
  string text_removed = swap_substr(start_char, chars_removed, text);
  size_t chars_inserted = SpyInput::char_count(text);
  // The stored entry describes how to revert: remove the characters that were
  // just inserted and put the removed text back.
  undo_stack.push_back(SpyInputEdit{start_char, chars_inserted, text_removed});
  return {start_char, chars_inserted, chars_removed};
}

// Reverts the most recent `replace` and returns a description of the edit
// that the reversal applied. There must be at least one edit to undo.
TSInputEdit SpyInput::undo() {
  assert(!undo_stack.empty());
  SpyInputEdit entry = undo_stack.back();
  undo_stack.pop_back();
  swap_substr(entry.position, entry.chars_removed, entry.text_inserted);
  size_t chars_inserted = SpyInput::char_count(entry.text_inserted);
  return TSInputEdit{entry.position, chars_inserted, entry.chars_removed};
}

// Removes `chars_removed` characters from `content` starting at character
// `start_char`, inserts `text` in their place, and returns the removed text.
// If fewer than `chars_removed` characters follow `start_char`, everything up
// to the end of the content is removed. `start_char` must lie within the
// content (asserted).
string SpyInput::swap_substr(size_t start_char, size_t chars_removed, string text) {
  const char *bytes = content.data();
  size_t size = content.size();

  long start_byte = byte_for_character(bytes, size, start_char);
  assert(start_byte >= 0);

  long bytes_removed = byte_for_character(bytes + start_byte, size - start_byte, chars_removed);
  if (bytes_removed < 0)
    bytes_removed = size - start_byte;

  string text_removed = content.substr(start_byte, bytes_removed);
  content.erase(start_byte, bytes_removed);
  content.insert(start_byte, text);

  return text_removed;
}

// Discards the record of chunks read so far.
void SpyInput::clear() {
  strings_read.clear();
}