slige/runtime/vm.hpp

282 lines
7.5 KiB
C++
Raw Normal View History

2024-11-08 11:22:42 +00:00
#pragma once
2024-11-26 13:32:21 +00:00
#include "alloc.hpp"
2024-11-08 11:22:42 +00:00
#include "arch.hpp"
2024-11-19 04:06:27 +00:00
#include "json.hpp"
2024-11-08 11:22:42 +00:00
#include "value.hpp"
#include <cstddef>
#include <cstdint>
2024-12-13 19:05:27 +00:00
#include <cstdio>
2024-11-19 04:06:27 +00:00
#include <string>
2024-12-16 17:23:51 +00:00
#include <utility>
2024-11-08 11:22:42 +00:00
#include <vector>
namespace sliger {
2024-11-18 14:01:24 +00:00
struct SourcePos {
int index;
int line;
int col;
};
struct FGNode {
2024-11-19 04:06:27 +00:00
FGNode(uint32_t fn, size_t parent)
: fn(fn)
, parent(parent)
{
}
2024-11-18 14:01:24 +00:00
uint32_t fn;
2024-11-19 04:06:27 +00:00
int64_t acc = 0;
int64_t ic_start = 0;
2024-11-18 14:01:24 +00:00
size_t parent;
2024-11-19 04:06:27 +00:00
// the vector's data may be placed all over the heap. this really really
// sucks. expect cachemisses when calling infrequently called functions. we
// might be lucky, that the current function and frequent call paths will be
// cached, but we have no way to assure this.
//
// maybe to fix this, a many-to-many relation table, using one single
// vector could be used. that would reduce cache misses, in exchange for
// table lookups.
std::vector<size_t> children = {};
};
class FlameGraphBuilder : public json::ToAndFromJson {
public:
inline void report_call(uint32_t fn, int64_t ic_start)
{
size_t found = find_or_create_child(fn);
this->nodes[found].ic_start = ic_start;
this->current = found;
}
inline void report_return(int64_t ic_end)
{
int64_t diff = ic_end - this->nodes[this->current].ic_start;
this->nodes[this->current].acc += diff;
this->current = this->nodes[this->current].parent;
}
2024-11-21 03:12:07 +00:00
inline void calculate_midway_result(int64_t ic)
{
calculate_node_midway_result(ic, this->current);
}
2024-11-19 04:06:27 +00:00
void to_json(json::Writer& writer) const override;
private:
inline auto find_or_create_child(uint32_t fn) -> size_t
{
auto found_child_index = this->find_child(fn);
if (found_child_index.has_value())
return found_child_index.value();
size_t new_child_index = this->nodes.size();
this->nodes.push_back(FGNode(fn, this->current));
this->nodes[this->current].children.push_back(new_child_index);
return new_child_index;
}
inline auto find_child(uint32_t fn) const -> std::optional<size_t>
{
for (auto child_idx : this->nodes[this->current].children) {
if (fn == this->nodes[child_idx].fn) {
return child_idx;
}
}
return {};
}
2024-11-21 03:12:07 +00:00
inline void calculate_node_midway_result(int64_t ic, size_t node_index)
{
2024-12-15 03:24:07 +00:00
int64_t diff = ic - this->nodes[node_index].ic_start;
this->nodes[node_index].acc += diff;
this->nodes[node_index].ic_start = ic;
if (node_index == 0)
2024-11-21 03:12:07 +00:00
return;
2024-12-15 03:24:07 +00:00
calculate_node_midway_result(ic, this->nodes[node_index].parent);
2024-11-21 03:12:07 +00:00
}
2024-11-19 04:06:27 +00:00
void fg_node_to_json(json::Writer& writer, size_t node_index) const;
std::vector<FGNode> nodes = { FGNode(0, 0) };
size_t current = 0;
};
struct CCPosEntry {
SourcePos pos;
int64_t covers = 0;
2024-11-18 14:01:24 +00:00
};
2024-11-19 04:06:27 +00:00
class CodeCoverageBuilder : public json::ToAndFromJson {
2024-11-18 14:01:24 +00:00
public:
2024-12-16 17:23:51 +00:00
inline void make_sure_entry_exists(SourcePos pos)
{
find_or_create_entry(pos);
}
2024-11-19 04:06:27 +00:00
/// call when leaving a source location
inline void report_cover(SourcePos pos)
{
size_t entry_index = find_or_create_entry(pos);
this->entries[entry_index].covers += 1;
}
2024-11-18 14:01:24 +00:00
2024-11-19 04:06:27 +00:00
void to_json(json::Writer& writer) const override;
2024-11-18 14:01:24 +00:00
private:
2024-11-19 04:06:27 +00:00
inline size_t find_or_create_entry(SourcePos pos)
{
if (auto found_index = find_pos_entry(pos); found_index.has_value())
return found_index.value();
size_t new_index = this->entries.size();
this->entries.push_back({ .pos = pos });
return new_index;
}
inline std::optional<size_t> find_pos_entry(SourcePos pos) const
{
for (size_t i = 0; i < this->entries.size(); ++i)
if (this->entries[i].pos.index == pos.index)
return i;
return {};
}
std::vector<CCPosEntry> entries = {};
2024-11-18 14:01:24 +00:00
};
struct VMOpts {
2024-11-19 04:06:27 +00:00
bool flame_graph;
bool code_coverage;
2024-12-13 19:17:22 +00:00
bool print_debug;
2024-11-18 14:01:24 +00:00
};
2024-11-08 11:22:42 +00:00
class VM {
public:
2024-12-15 02:07:33 +00:00
VM(std::vector<uint32_t> program, VMOpts opts)
2024-11-18 14:01:24 +00:00
: opts(opts)
2024-12-15 02:07:33 +00:00
, program(std::move(program))
2024-11-08 11:22:42 +00:00
{
}
2024-11-19 04:06:27 +00:00
void run_until_done();
void run_n_instructions(size_t amount);
void run_instruction();
2024-12-15 02:07:33 +00:00
inline auto done() const -> bool
{
return this->pc >= this->program.size();
}
2024-12-15 00:32:21 +00:00
2024-11-19 04:06:27 +00:00
inline auto flame_graph_json() const -> std::string
{
return json::to_json(this->flame_graph);
}
2024-12-16 17:23:51 +00:00
inline auto code_coverage_json() -> std::string
2024-11-19 04:06:27 +00:00
{
2024-12-16 17:23:51 +00:00
for (size_t i = 0; i < this->program.size(); ++i) {
if (this->program.at(i) == std::to_underlying(Op::SourceMap)
&& this->program.size() - 1 - i >= 3) {
auto index = static_cast<int32_t>(this->program.at(i + 1));
auto line = static_cast<int32_t>(this->program.at(i + 2));
auto col = static_cast<int32_t>(this->program.at(i + 3));
this->code_coverage.make_sure_entry_exists(
{ index, line, col });
}
i += instruction_size(i);
}
2024-11-19 04:06:27 +00:00
return json::to_json(this->code_coverage);
}
inline auto view_stack() const -> const std::vector<Value>&
{
return this->stack;
}
2024-12-13 15:11:16 +00:00
auto stack_repr_string(size_t max_items) const -> std::string;
2024-11-19 04:06:27 +00:00
private:
2024-12-10 23:18:51 +00:00
void run_builtin(Builtin builtin_id);
2024-12-13 19:05:27 +00:00
void run_string_builtin(Builtin builtin_id);
void run_array_builtin(Builtin builtin_id);
2024-12-31 02:38:38 +00:00
void run_struct_builtin(Builtin builtin_id);
2024-12-13 19:05:27 +00:00
void run_file_builtin(Builtin builtin_id);
2024-12-10 23:18:51 +00:00
2024-11-08 11:22:42 +00:00
inline void step() { this->pc += 1; }
2024-11-11 14:31:54 +00:00
inline auto eat_op() -> Op
2024-11-08 11:22:42 +00:00
{
auto value = curr_as_op();
step();
return value;
}
inline auto curr_as_op() const -> Op
{
return static_cast<Op>(this->program[this->pc]);
}
2024-11-11 14:31:54 +00:00
inline auto eat_int32() -> int32_t
{
auto value = curr_as_int32();
step();
return value;
}
inline auto curr_as_int32() const -> int32_t
{
return static_cast<int32_t>(this->program[this->pc]);
}
inline auto eat_uint32() -> uint32_t
{
auto value = curr_as_uint32();
step();
return value;
}
inline auto curr_as_uint32() const -> uint32_t
{
return this->program[this->pc];
}
inline auto fn_stack_at(size_t idx) -> Value&
{
return this->stack.at(this->bp + idx);
}
2024-12-16 17:23:51 +00:00
void assert_program_has(size_t count);
2024-12-13 15:11:16 +00:00
void assert_fn_stack_has(size_t count);
void assert_stack_has(size_t count);
2024-11-11 14:31:54 +00:00
inline void stack_push(Value&& value) { this->stack.push_back(value); }
inline void stack_push(Value& value) { this->stack.push_back(value); }
inline auto stack_pop() -> Value
{
auto value = this->stack.at(this->stack.size() - 1);
this->stack.pop_back();
return value;
}
2024-12-16 17:23:51 +00:00
size_t instruction_size(size_t i) const;
2024-11-11 14:31:54 +00:00
2024-11-18 14:01:24 +00:00
VMOpts opts;
2024-11-08 11:22:42 +00:00
uint32_t pc = 0;
2024-11-11 14:31:54 +00:00
uint32_t bp = 0;
2024-12-15 02:07:33 +00:00
std::vector<uint32_t> program;
2024-11-08 11:22:42 +00:00
std::vector<Value> stack;
2024-12-10 23:18:51 +00:00
std::vector<Value> statics;
2024-11-26 13:32:21 +00:00
heap::Heap heap;
2024-11-18 14:01:24 +00:00
SourcePos current_pos = { 0, 1, 1 };
2024-11-19 04:06:27 +00:00
int64_t instruction_counter = 0;
2024-12-13 19:05:27 +00:00
int32_t file_id_counter = 3;
std::unordered_map<int32_t, FILE*> open_files {
{ 0, stdin },
{ 1, stdout },
{ 2, stderr },
};
2024-11-19 04:06:27 +00:00
FlameGraphBuilder flame_graph;
CodeCoverageBuilder code_coverage;
2024-11-08 11:22:42 +00:00
};
2024-11-18 14:01:24 +00:00
2024-12-12 15:07:59 +00:00
auto maybe_op_to_string(uint32_t value) -> std::string;
2024-12-13 19:05:27 +00:00
auto maybe_builtin_to_string(uint32_t value) -> std::string;
2024-12-12 15:07:59 +00:00
2024-11-08 11:22:42 +00:00
}