diff options
author | Roland Reichwein <mail@reichwein.it> | 2020-11-16 12:48:44 +0100 |
---|---|---|
committer | Roland Reichwein <mail@reichwein.it> | 2020-11-16 12:48:44 +0100 |
commit | c9cb051fae190acfc36813e4a23759fb9b9c3df3 (patch) | |
tree | fcd8c93cd5dc2a3272eac253b0291611e16ea13f | |
parent | 300219dc8519720a36525c7b40c6a327580fe0bd (diff) |
Implement hierarchical evaluation (WIP)
-rw-r--r-- | asm/intel64/codes.cpp | 43 | ||||
-rw-r--r-- | asm/intel64/codes.h | 4 | ||||
-rw-r--r-- | asm/intel64/encode.cpp | 168 | ||||
-rw-r--r-- | asm/operators.cpp | 17 | ||||
-rw-r--r-- | asm/operators.h | 2 | ||||
-rw-r--r-- | asm/segment.cpp | 5 | ||||
-rw-r--r-- | asm/segment.h | 1 | ||||
-rw-r--r-- | flowgraph/node.cpp | 16 | ||||
-rw-r--r-- | flowgraph/scope.cpp | 10 | ||||
-rw-r--r-- | flowgraph/scope.h | 4 | ||||
-rw-r--r-- | flowgraph/storage.cpp | 10 | ||||
-rw-r--r-- | flowgraph/storage.h | 5 | ||||
-rw-r--r-- | minicc.cpp | 13 | ||||
-rw-r--r-- | minicc.h | 3 |
14 files changed, 218 insertions, 83 deletions
diff --git a/asm/intel64/codes.cpp b/asm/intel64/codes.cpp index 58d921f..9f82d37 100644 --- a/asm/intel64/codes.cpp +++ b/asm/intel64/codes.cpp @@ -1,5 +1,8 @@ #include "codes.h" +#include "minicc.h" +#include "../operators.h" + #include <exception> #include <unordered_map> @@ -44,12 +47,13 @@ namespace { {"rdx", 2}, {"rdi", 7}, }; -} +} // namespace // Manual, page 530 // Reg + Reg/Memory -uint8_t ModRM(const std::string& reg, const std::string& rm) { - uint8_t result{0b11000000}; // TODO: other than 11: Indexed forms of r/m +std::vector<uint8_t> ModRM(const std::string& reg, const std::string& rm, int32_t disp) { + uint8_t result{}; // MOD is highest 2 bits, then 3 bits Reg, the 3 bits R/M + std::vector<uint8_t> displacement_bytes; size_t val_reg{}; // reg @@ -60,22 +64,35 @@ uint8_t ModRM(const std::string& reg, const std::string& rm) { throw std::runtime_error("ModRM: Bad digit in arg1: "s + reg); } } else { // reg - auto index1{ IndexOfRegister.find(reg) }; - if (index1 == IndexOfRegister.end()) - throw std::runtime_error("ModRM: Unknown register for arg1: "s + reg); - val_reg = index1->second; + val_reg = RegNo(reg); } result |= (val_reg << 3); // rm - auto index2{ IndexOfRegister.find(rm) }; - if (index2 == IndexOfRegister.end()) - throw std::runtime_error("Unknown register for arg2: "s + rm); - - result |= index2->second; + if (rm.size() > 2 && rm.front() == '[' && rm.back() == ']') { // indexed / MemPtr + uint8_t rm_bits {RegNo(rm.substr(1, rm.size() - 2))}; + if (rm_bits == 4) + throw std::runtime_error("ICE: SIB byte not yet supported"); + + if (disp == 0 && rm_bits != 5) { // no displacement + // ignore: keep MOD == 00, no displacement bytes + if (rm_bits == 5) + throw std::runtime_error("ICE: [rbp] with now displacement is not supported"); // TODO: Support this, and SIB byte + } else if (disp >= -128 && disp < 128) { + result |= 0b01000000; // 8 bit displacement + displacement_bytes.push_back(uint8_t(disp)); + } else { + result |= 0b10000000; // 32 bit displacement + displacement_bytes += to_little_endian(disp); + } + result |= rm_bits; + } else { // normal register access + result |= 0b11000000; + result |= RegNo(rm); + } - return result; + return std::vector<uint8_t>{result} + displacement_bytes; } uint8_t RegNo(const std::string& reg) diff --git a/asm/intel64/codes.h b/asm/intel64/codes.h index 112eef4..ba378a6 100644 --- a/asm/intel64/codes.h +++ b/asm/intel64/codes.h @@ -9,7 +9,9 @@ std::vector<uint8_t> REX(const std::string& s); // Manual, page 530 // Reg + Reg/Memory -uint8_t ModRM(const std::string& reg, const std::string& rm); +// disp: optional, only necessary in some cases, e.g. indexed memory access +// returns: Encoded ModRM byte, followed by SIB and disp bytes, if appropriate +std::vector<uint8_t> ModRM(const std::string& reg, const std::string& rm, int32_t disp = 0); // Just the number of reg, e.g. for encoding inside primary opcode uint8_t RegNo(const std::string& reg); diff --git a/asm/intel64/encode.cpp b/asm/intel64/encode.cpp index 681e407..0806b56 100644 --- a/asm/intel64/encode.cpp +++ b/asm/intel64/encode.cpp @@ -8,6 +8,113 @@ #include <exception> +namespace { + +std::shared_ptr<Op> makeLoadValue(FlowGraph::Data& data) +{ + if (data.type() != FlowGraph::DataType::Int) { + std::runtime_error("Bad type for operand: "s + std::to_string(int(data.type()))); + } + + if (!data.storage()) + throw std::runtime_error("ICE: Operand storage is 0"); + + auto& data_storage{*data.storage()}; + if (typeid(data_storage) == typeid(FlowGraph::Constant)) { + FlowGraph::Constant& value {dynamic_cast<FlowGraph::Constant&>(data_storage)}; + if (value.value().size() < sizeof(uint32_t)) + throw std::runtime_error("ICE: Int data from operand needs at least 4 bytes, got "s + std::to_string(value.value().size())); + + uint32_t immediate = from_little_endian(value.value()); + + return makeOp("mov", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Immediate32(immediate)}}); + } else if (typeid(data_storage) == typeid(FlowGraph::TemporaryStorage)) { + FlowGraph::TemporaryStorage& storage {dynamic_cast<FlowGraph::TemporaryStorage&>(data_storage)}; + + index_t index { storage.indexOfStorage()}; + return makeOp("mov", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Mem32Ptr64("rbp", int32_t(index) * -4)}}); + } else + throw std::runtime_error("ICE: Unsupported type for operand data at load: "s + demangle(typeid(data_storage))); +} + +std::shared_ptr<Op> makeStoreValue(FlowGraph::Data& data) +{ + if (data.type() != FlowGraph::DataType::Int) { + std::runtime_error("Bad type for operand: "s + std::to_string(int(data.type()))); + } + + if (!data.storage()) + throw std::runtime_error("ICE: Operand storage is 0"); + + auto& data_storage{*data.storage()}; + if (typeid(data_storage) == typeid(FlowGraph::TemporaryStorage)) { + FlowGraph::TemporaryStorage& storage {dynamic_cast<FlowGraph::TemporaryStorage&>(data_storage)}; + + index_t index { storage.indexOfStorage()}; + return makeOp("mov", Asm::Args{{Asm::Args::Mem32Ptr64("rbp", int32_t(index) * -4), Asm::Args::Register32("eax")}}); + } else + throw std::runtime_error("ICE: Unsupported type for operand data at store: "s + demangle(typeid(data_storage))); +} + +std::shared_ptr<Op> makeAddValue(FlowGraph::Data& data) +{ + if (data.type() != FlowGraph::DataType::Int) { + std::runtime_error("Bad type for operand: "s + std::to_string(int(data.type()))); + } + + if (!data.storage()) + throw std::runtime_error("ICE: Operand storage is 0"); + + auto& data_storage{*data.storage()}; + if (typeid(data_storage) == typeid(FlowGraph::Constant)) { + FlowGraph::Constant& value {dynamic_cast<FlowGraph::Constant&>(data_storage)}; + if (value.value().size() < sizeof(uint32_t)) + throw std::runtime_error("ICE: Int data from operand needs at least 4 bytes, got "s + std::to_string(value.value().size())); + + uint32_t immediate = from_little_endian(value.value()); + + return makeOp("add", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Immediate32(immediate)}}); + } else if (typeid(data_storage) == typeid(FlowGraph::TemporaryStorage)) { + FlowGraph::TemporaryStorage& storage {dynamic_cast<FlowGraph::TemporaryStorage&>(data_storage)}; + + index_t index { storage.indexOfStorage()}; + return makeOp("add", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Mem32Ptr64("rbp", int32_t(index) * -4)}}); + } else + throw std::runtime_error("ICE: Unsupported type for operand data at add: "s + demangle(typeid(data_storage))); +} + +std::vector<std::shared_ptr<Chunk>> makeMulValue(FlowGraph::Data& data) +{ + if (data.type() != FlowGraph::DataType::Int) { + std::runtime_error("Bad type for operand: "s + std::to_string(int(data.type()))); + } + + if (!data.storage()) + throw std::runtime_error("ICE: Operand storage is 0"); + + auto& data_storage{*data.storage()}; + if (typeid(data_storage) == typeid(FlowGraph::Constant)) { + FlowGraph::Constant& value {dynamic_cast<FlowGraph::Constant&>(data_storage)}; + if (value.value().size() < sizeof(uint32_t)) + throw std::runtime_error("ICE: Int data from operand needs at least 4 bytes, got "s + std::to_string(value.value().size())); + + uint32_t immediate = from_little_endian(value.value()); + + return {{ + makeOp("mov", Asm::Args{{Asm::Args::Register32("ebx"), Asm::Args::Immediate32(immediate)}}), + makeOp("mul", Asm::Args{{Asm::Args::Register32("ebx")}}) + }}; + } else if (typeid(data_storage) == typeid(FlowGraph::TemporaryStorage)) { + FlowGraph::TemporaryStorage& storage {dynamic_cast<FlowGraph::TemporaryStorage&>(data_storage)}; + + index_t index { storage.indexOfStorage()}; + return {{makeOp("mul", Asm::Args{{Asm::Args::Mem32Ptr64("rbp", int32_t(index) * -4)}})}}; + } else + throw std::runtime_error("ICE: Unsupported type for operand data at mul: "s + demangle(typeid(data_storage))); +} + +} // namespace + void Asm::toMachineCode(const FlowGraph::Graph& graph, Segment& segment) { segment.clear(); @@ -48,61 +155,14 @@ void Asm::toMachineCode(const FlowGraph::Graph& graph, Segment& segment) auto operands {op.operands()}; -#if 0 - if (op.type() == FlowGraph::BinaryOperationType::Add) { - segment.push_back(loadmakeOp("add", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Immediate32(immediate2)}})); - } else if (op.type() == FlowGraph::BinaryOperationType::Multiply) { - segment.push_back(makeOp("mov", Asm::Args{{Asm::Args::Register32("ebx"), Asm::Args::Immediate32(immediate2)}})); - segment.push_back(makeOp("mul", Asm::Args{{Asm::Args::Register32("ebx")}})); - } else - throw std::runtime_error("ICE: Asm: Unsupported binary operation type: "s + std::to_string(static_cast<int>(op.type()))); -#endif - - - - - if (operands[1].type() != FlowGraph::DataType::Int) { - std::runtime_error("Bad type for operand 1: "s + std::to_string(int(operands[1].type()))); - } - - if (operands[2].type() != FlowGraph::DataType::Int) { - std::runtime_error("Bad type for operand 2: "s + std::to_string(int(operands[2].type()))); - } - - if (!operands[1].storage()) - throw std::runtime_error("ICE: Operand 1 storage is 0"); - if (!operands[2].storage()) - throw std::runtime_error("ICE: Operand 2 storage is 0"); - - uint32_t immediate1{}; - try { - FlowGraph::Constant& value1 {dynamic_cast<FlowGraph::Constant&>(*operands[1].storage())}; - if (value1.value().size() < sizeof(uint32_t)) - throw std::runtime_error("ICE: Int data from operand 1 needs at least 4 bytes, got "s + std::to_string(value1.value().size())); - - immediate1 = boost::endian::little_to_native(*(reinterpret_cast<const uint32_t*>(value1.value().data()))); - } catch (const std::bad_cast& ex) { - std::runtime_error("Bad value for operand 1: Constant expected"); - } - - uint32_t immediate2{}; - try { - FlowGraph::Constant& value2 {dynamic_cast<FlowGraph::Constant&>(*operands[2].storage())}; - if (value2.value().size() < sizeof(uint32_t)) - throw std::runtime_error("ICE: Int data from operand 2 needs at least 4 bytes, got "s + std::to_string(value2.value().size())); - - immediate2 = boost::endian::little_to_native(*(reinterpret_cast<const uint32_t*>(value2.value().data()))); - } catch (const std::bad_cast& ex) { - std::runtime_error("Bad value for operand 2: Constant expected"); - } - - segment.push_back(makeOp("mov", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Immediate32(immediate1)}})); - if (op.type() == FlowGraph::BinaryOperationType::Add) { - segment.push_back(makeOp("add", Asm::Args{{Asm::Args::Register32("eax"), Asm::Args::Immediate32(immediate2)}})); + segment.push_back(makeLoadValue(operands[1])); + segment.push_back(makeAddValue(operands[2])); + segment.push_back(makeStoreValue(operands[0])); } else if (op.type() == FlowGraph::BinaryOperationType::Multiply) { - segment.push_back(makeOp("mov", Asm::Args{{Asm::Args::Register32("ebx"), Asm::Args::Immediate32(immediate2)}})); - segment.push_back(makeOp("mul", Asm::Args{{Asm::Args::Register32("ebx")}})); + segment.push_back(makeLoadValue(operands[1])); + segment.append(makeMulValue(operands[2])); + segment.push_back(makeStoreValue(operands[0])); } else throw std::runtime_error("ICE: Asm: Unsupported binary operation type: "s + std::to_string(static_cast<int>(op.type()))); @@ -115,7 +175,7 @@ void Asm::toMachineCode(const FlowGraph::Graph& graph, Segment& segment) //FlowGraph::DestroyScopeOp& op {dynamic_cast<FlowGraph::DestroyScopeOp&>(*node)}; segment.push_back(makeOp("pop", Asm::Args{{Asm::Args::Register64("rbp")}})); - // Move eax for exit() via rdi + // Move eax (still present from last operation) for exit() via rdi segment.push_back(makeOp("xor", Asm::Args{{Asm::Args::Register64("rdi"), Asm::Args::Register64("rdi")}})); segment.push_back(makeOp("mov", Asm::Args{{Asm::Args::Register32("edi"), Asm::Args::Register32("eax")}})); } else if (typeid(node_deref) == typeid(FlowGraph::DataNode)) { diff --git a/asm/operators.cpp b/asm/operators.cpp index 9f7d5d9..9cd02a1 100644 --- a/asm/operators.cpp +++ b/asm/operators.cpp @@ -1,13 +1,26 @@ #include "operators.h" // binary code operators -std::vector<uint8_t> operator+(std::vector<uint8_t> a, const std::vector<uint8_t>& b) { +std::vector<uint8_t> operator+(std::vector<uint8_t> a, const std::vector<uint8_t>& b) +{ a.insert(a.end(), b.begin(), b.end()); return a; } -std::vector<uint8_t> operator+(std::vector<uint8_t> a, const uint8_t& b) { +std::vector<uint8_t> operator+(std::vector<uint8_t> a, const uint8_t& b) +{ a.push_back(b); return a; } +std::vector<uint8_t> operator+=(std::vector<uint8_t>& a, const std::vector<uint8_t>& b) +{ + a.insert(a.end(), b.begin(), b.end()); + return a; +} + +std::vector<uint8_t> operator+=(std::vector<uint8_t>& a, const uint8_t& b) +{ + a.push_back(b); + return a; +} diff --git a/asm/operators.h b/asm/operators.h index 741ec72..280de58 100644 --- a/asm/operators.h +++ b/asm/operators.h @@ -8,3 +8,5 @@ std::vector<uint8_t> operator+(std::vector<uint8_t> a, const std::vector<uint8_t>& b); std::vector<uint8_t> operator+(std::vector<uint8_t> a, const uint8_t& b); +std::vector<uint8_t> operator+=(std::vector<uint8_t>& a, const std::vector<uint8_t>& b); +std::vector<uint8_t> operator+=(std::vector<uint8_t>& a, const uint8_t& b); diff --git a/asm/segment.cpp b/asm/segment.cpp index d3050bb..9d439fd 100644 --- a/asm/segment.cpp +++ b/asm/segment.cpp @@ -9,6 +9,11 @@ using namespace std::string_literals; +void Segment::append(const std::vector<std::shared_ptr<Chunk>>& list) +{ + insert(end(), list.cbegin(), list.cend()); +} + size_t Segment::getAddressOfLabel(const std::string& label) { size_t address{0}; diff --git a/asm/segment.h b/asm/segment.h index 97e1670..b4b31f8 100644 --- a/asm/segment.h +++ b/asm/segment.h @@ -10,6 +10,7 @@ class Segment: public std::vector<std::shared_ptr<Chunk>> { public: + void append(const std::vector<std::shared_ptr<Chunk>>& list); size_t getAddressOfLabel(const std::string& label); size_t getAddressOfIndex(size_t index); std::vector<uint8_t> getCode(); diff --git a/flowgraph/node.cpp b/flowgraph/node.cpp index e0912dc..2d757f9 100644 --- a/flowgraph/node.cpp +++ b/flowgraph/node.cpp @@ -4,6 +4,8 @@ #include <boost/endian/conversion.hpp> +#include <memory> + using namespace FlowGraph; FlowGraph::Data& Node::destination() @@ -19,22 +21,28 @@ Data FlowGraph::MakeConstantInt(int i) { std::vector<uint8_t> value(size_t(4), uint8_t(0)); *(reinterpret_cast<int32_t*>(value.data())) = boost::endian::native_to_little(static_cast<int32_t>(i)); - return Data(DataType::Int, std::make_shared<Constant>(value)); + return Data{DataType::Int, std::make_shared<Constant>(value)}; } Data FlowGraph::MakeLocalPointer(FlowGraph::LocalScope& scope, const std::string& name) { - return Data(DataType::Pointer, std::make_shared<LocalStorage>(scope, name)); + Data data{DataType::Pointer, std::make_shared<LocalStorage>(scope, name)}; + scope.push_back(std::make_shared<Data>(data)); + return data; } Data FlowGraph::MakeLocalSize(FlowGraph::LocalScope& scope, const std::string& name) { - return Data(DataType::Size, std::make_shared<LocalStorage>(scope, name)); + Data data{DataType::Size, std::make_shared<LocalStorage>(scope, name)}; + scope.push_back(std::make_shared<Data>(data)); + return data; } Data FlowGraph::MakeTemporaryInt(FlowGraph::LocalScope& scope) { - return Data(DataType::Int, std::make_shared<TemporaryStorage>(scope)); + Data data{DataType::Int, std::make_shared<TemporaryStorage>(scope)}; + scope.push_back(std::make_shared<Data>(data)); + return data; } LocalScope& CreateScopeOp::scope() diff --git a/flowgraph/scope.cpp b/flowgraph/scope.cpp index 6c2e30c..54a3cca 100644 --- a/flowgraph/scope.cpp +++ b/flowgraph/scope.cpp @@ -12,16 +12,14 @@ void FlowGraph::LocalScope::append(const FlowGraph::LocalScope& other) m_variables.insert(m_variables.end(), other.m_variables.begin(), other.m_variables.end()); } -index_t FlowGraph::LocalScope::indexOfStorage(const TemporaryStorage& storage) const +index_t FlowGraph::LocalScope::indexOfStorage(const Storage& storage) const { + std::cout << "DEBUG: " << m_variables.size() << std::endl; for (index_t i = 0; i < m_variables.size(); i++) { FlowGraph::Storage& i_storage {*(m_variables[i]->storage())}; - if (typeid(i_storage) == typeid(FlowGraph::TemporaryStorage)) { - FlowGraph::TemporaryStorage& temporaryStorage{dynamic_cast<FlowGraph::TemporaryStorage&>(i_storage)}; - if (&temporaryStorage == &storage) // compare addresses - return i; - } + if (&i_storage == &storage) // compare addresses + return i; } throw std::runtime_error("ICE: Storage not found"); diff --git a/flowgraph/scope.h b/flowgraph/scope.h index 50003f4..65898cf 100644 --- a/flowgraph/scope.h +++ b/flowgraph/scope.h @@ -10,7 +10,7 @@ namespace FlowGraph { - class TemporaryStorage; ///< Forward declaration + class Storage; ///< Forward declaration // Provide a context for local temporaries name generation class LocalScope @@ -20,7 +20,7 @@ namespace FlowGraph { void push_back(std::shared_ptr<Data> data); void append(const LocalScope& other); - index_t indexOfStorage(const TemporaryStorage& storage) const; + index_t indexOfStorage(const Storage& storage) const; private: std::vector<std::shared_ptr<Data>> m_variables; diff --git a/flowgraph/storage.cpp b/flowgraph/storage.cpp index 7e502de..e9577d6 100644 --- a/flowgraph/storage.cpp +++ b/flowgraph/storage.cpp @@ -11,3 +11,13 @@ std::string FlowGraph::TemporaryStorage::name() const { return "__local_"s + std::to_string(m_scope.indexOfStorage(*this)); } + +index_t FlowGraph::TemporaryStorage::indexOfStorage() const +{ + return m_scope.indexOfStorage(*this); +} + +index_t FlowGraph::LocalStorage::indexOfStorage() const +{ + return m_scope.indexOfStorage(*this); +} diff --git a/flowgraph/storage.h b/flowgraph/storage.h index 7f648b0..27c201e 100644 --- a/flowgraph/storage.h +++ b/flowgraph/storage.h @@ -42,10 +42,12 @@ namespace FlowGraph { class LocalStorage : public Storage { public: - LocalStorage(LocalScope& scope, const std::string& name): m_name(name) {} + LocalStorage(LocalScope& scope, const std::string& name): m_name(name), m_scope(scope) {} const std::string& name() const { return m_name; } + index_t indexOfStorage() const; private: std::string m_name; + LocalScope& m_scope; }; // intermediate results, anonymous values @@ -55,6 +57,7 @@ namespace FlowGraph { public: TemporaryStorage(LocalScope& scope); std::string name() const; + index_t indexOfStorage() const; private: LocalScope& m_scope; }; @@ -4,6 +4,7 @@ #include "minicc.h" #include <boost/algorithm/string.hpp> +#include <boost/endian/conversion.hpp> #include <algorithm> #include <cctype> @@ -65,3 +66,15 @@ std::string demangle(const std::type_info& type) return boost::core::demangle(type.name()); } +std::vector<uint8_t> to_little_endian(uint32_t value) +{ + std::vector<uint8_t> result(size_t(4)); + *(reinterpret_cast<uint32_t*>(result.data())) = boost::endian::native_to_little(value); + return result; +} + +uint32_t from_little_endian(const std::vector<uint8_t>& value) +{ + return boost::endian::little_to_native(*(reinterpret_cast<const uint32_t*>(value.data()))); +} + @@ -51,3 +51,6 @@ struct PairHashSS { }; std::string demangle(const std::type_info& type); + +std::vector<uint8_t> to_little_endian(uint32_t value); +uint32_t from_little_endian(const std::vector<uint8_t>& value); |