rve/src/vm.cpp

297 lines
11 KiB
C++
Raw Normal View History

#include "vm.hpp"
#include <cstdint>
#include <cstring>
2024-12-09 20:17:21 +00:00
#include <fstream>
#include <iostream>
#include <stdexcept>
#include <vector>
inline int32_t sign_extend(int32_t value, int bits) {
int32_t mask = 1 << (bits - 1);
return (value ^ mask) - mask;
}
2024-12-09 20:17:21 +00:00
VM::VM(std::vector<uint8_t> memory) : memory_(memory) {}
2024-12-09 00:29:19 +00:00
std::vector<uint8_t> VM::read_memory(size_t start, size_t size) {
2024-12-09 20:17:21 +00:00
if (start + size > memory_.size()) {
return std::vector<uint8_t>(size, 0);
}
2024-12-09 00:29:19 +00:00
return std::vector<uint8_t>(memory_.begin() + start,
memory_.begin() + start + size);
}
2024-12-09 21:21:47 +00:00
uint32_t VM::read_memory_word(size_t pos) { return *(uint32_t*)&memory_[pos]; }
void VM::write_memory_word(size_t pos, uint32_t value) {
*(uint32_t*)&memory_[pos] = value;
}
uint32_t VM::read_register(size_t regnum) {
2024-12-09 20:17:21 +00:00
if (regnum == 32) return pc;
if (regnum >= NUM_REGISTERS) {
throw std::runtime_error("Register out of range");
}
return registers[regnum];
}
2024-12-09 20:17:21 +00:00
void VM::step() {
2024-12-09 00:29:19 +00:00
size_t memory_size = memory_.size();
2024-12-09 20:17:21 +00:00
uint8_t* memory = &memory_[0];
2024-12-09 00:29:19 +00:00
2024-12-09 20:17:21 +00:00
uint32_t instr = *(uint32_t*)&memory[pc];
// std::cout << "pc: " << std::hex << pc << std::dec << "\n";
// std::cout << "instr: " << std::hex << instr << "\n";
pc += 4;
2024-12-09 20:17:21 +00:00
// Decode instruction
uint32_t opcode = instr & 0x7F;
uint32_t rd = (instr >> 7) & 0x1F;
uint32_t funct3 = (instr >> 12) & 0x7;
uint32_t rs1 = (instr >> 15) & 0x1F;
uint32_t rs2 = (instr >> 20) & 0x1F;
uint32_t funct7 = (instr >> 25);
int32_t imm;
2024-12-09 20:17:21 +00:00
switch (opcode) {
case 0x33: { // R-type
2024-12-06 21:58:16 +00:00
if (funct7 == 0x00) {
2024-12-09 20:17:21 +00:00
if (funct3 == 0x0) { // ADD
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] + registers[rs2];
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x04) { // XOR
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] ^ registers[rs2];
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x06) { // OR
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] | registers[rs2];
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x07) { // AND
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] & registers[rs2];
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x01) { // SLL
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] << registers[rs2];
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x05) { // SRL
2024-12-06 21:58:16 +00:00
uint32_t value = registers[rs1];
uint32_t shift_amount = registers[rs2] & 0x1F;
registers[rd] = value << shift_amount;
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x02) { // SLT
registers[rd] = (static_cast<int32_t>(registers[rs1]) <
static_cast<int32_t>(registers[rs2]))
? 0
: 1;
} else if (funct3 == 0x03) { // SLTU
2024-12-06 21:58:16 +00:00
registers[rd] = (registers[rs1] < registers[rs2]) ? 1 : 0;
} else {
throw std::runtime_error("Unknown R-type instruction");
}
2024-12-06 21:58:16 +00:00
} else if (funct7 == 0x20) {
2024-12-09 20:17:21 +00:00
if (funct3 == 0x0) { // SUB
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] - registers[rs2];
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x05) { // SRA
2024-12-06 21:58:16 +00:00
// Only the lower 5 bits are used for shift
int32_t value = static_cast<int32_t>(registers[rs1]);
int32_t shift_amount = registers[rs2] & 0x1F;
registers[rd] = value >> shift_amount;
} else {
throw std::runtime_error("Unknown R-type instruction");
}
} else if (funct7 == 0x01) {
2024-12-09 20:17:21 +00:00
if (funct3 == 0x0) { // MUL
int64_t result =
static_cast<int64_t>(static_cast<int32_t>(registers[rs1])) *
static_cast<int64_t>(static_cast<int32_t>(registers[rs2]));
2024-12-06 21:58:16 +00:00
registers[rd] = static_cast<uint32_t>(result);
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x1) { // MULH
int64_t result =
static_cast<int64_t>(static_cast<int32_t>(registers[rs1])) *
static_cast<int64_t>(static_cast<int32_t>(registers[rs2]));
2024-12-06 21:58:16 +00:00
registers[rd] = static_cast<uint32_t>(result >> 32);
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x2) { // MULSU
int64_t result =
static_cast<int64_t>(static_cast<int32_t>(registers[rs1])) *
static_cast<uint64_t>(registers[rs2]);
2024-12-06 21:58:16 +00:00
registers[rd] = static_cast<uint32_t>(result >> 32);
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x3) { // MULU
2024-12-06 21:58:16 +00:00
uint64_t result = static_cast<uint64_t>(registers[rs1]) *
2024-12-09 20:17:21 +00:00
static_cast<uint64_t>(registers[rs2]);
registers[rd] = static_cast<uint32_t>(result >> 32); // Upper 32 bits
} else if (funct3 == 0x4) { // DIV
2024-12-06 21:58:16 +00:00
int32_t dividend = static_cast<int32_t>(registers[rs1]);
int32_t divisor = static_cast<int32_t>(registers[rs2]);
if (divisor == 0) {
2024-12-09 20:17:21 +00:00
registers[rd] = -1; // Division by zero result
2024-12-06 21:58:16 +00:00
} else if (dividend == INT32_MIN && divisor == -1) {
2024-12-09 20:17:21 +00:00
registers[rd] = dividend; // Overflow case
2024-12-06 21:58:16 +00:00
} else {
registers[rd] = dividend / divisor;
}
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x5) { // DIVU
2024-12-06 21:58:16 +00:00
uint32_t dividend = registers[rs1];
uint32_t divisor = registers[rs2];
registers[rd] = (divisor == 0) ? UINT32_MAX : dividend / divisor;
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x6) { // REM
2024-12-06 21:58:16 +00:00
int32_t dividend = static_cast<int32_t>(registers[rs1]);
int32_t divisor = static_cast<int32_t>(registers[rs2]);
if (divisor == 0) {
2024-12-09 20:17:21 +00:00
registers[rd] =
dividend; // Remainder with zero divisor is the dividend
2024-12-06 21:58:16 +00:00
} else if (dividend == INT32_MIN && divisor == -1) {
2024-12-09 20:17:21 +00:00
registers[rd] = 0; // Overflow case
2024-12-06 21:58:16 +00:00
} else {
registers[rd] = dividend % divisor;
}
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x7) { // REMU
2024-12-06 21:58:16 +00:00
uint32_t dividend = registers[rs1];
uint32_t divisor = registers[rs2];
registers[rd] = (divisor == 0) ? dividend : dividend % divisor;
} else {
throw std::runtime_error("Unknown R-type instruction");
}
} else {
throw std::runtime_error("Unknown R-type instruction");
}
break;
}
2024-12-09 20:17:21 +00:00
case 0x13: { // I-type (ADDI)
imm = sign_extend(instr >> 20, 12); // Extract 12-bit immediate
if (funct3 == 0x0) { // ADDI
2024-12-06 21:58:16 +00:00
registers[rd] = registers[rs1] + imm;
} else {
throw std::runtime_error("Unknown I-type instruction");
}
break;
}
2024-12-09 20:17:21 +00:00
case 0x63: { // B-type (branches)
2024-12-06 21:58:16 +00:00
imm = ((instr >> 7) & 0x1E) | ((instr >> 20) & 0x7E0) |
2024-12-09 20:17:21 +00:00
((instr >> 19) & 0x800) | ((instr >> 31) << 12);
imm = sign_extend(imm, 13); // Sign-extend 13-bit immediate
if (funct3 == 0x0) { // BEQ
2024-12-06 21:58:16 +00:00
if (registers[rs1] == registers[rs2]) {
2024-12-09 20:17:21 +00:00
pc += imm - 4; // Offset PC (adjust for pre-increment)
2024-12-06 21:58:16 +00:00
}
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x1) { // BNE
2024-12-06 21:58:16 +00:00
if (registers[rs1] != registers[rs2]) {
2024-12-09 20:17:21 +00:00
pc += imm - 4; // Offset PC
2024-12-06 21:58:16 +00:00
}
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x4) { // BLT
2024-12-06 21:58:16 +00:00
if (static_cast<int32_t>(registers[rs1]) <
static_cast<int32_t>(registers[rs2])) {
pc += imm - 4;
}
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x5) { // BGE
2024-12-06 21:58:16 +00:00
if (static_cast<int32_t>(registers[rs1]) >=
static_cast<int32_t>(registers[rs2])) {
pc += imm - 4;
}
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x6) { // BLTU
2024-12-06 21:58:16 +00:00
if (registers[rs1] < registers[rs2]) pc += imm - 4;
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x7) { // BGEU
2024-12-06 21:58:16 +00:00
if (registers[rs1] >= registers[rs2]) pc += imm - 4;
} else {
throw std::runtime_error("Unknown B-type instruction");
}
break;
}
2024-12-09 20:17:21 +00:00
case 0x03: { // I-type (loads)
imm = sign_extend(instr >> 20, 12); // Extract 12-bit immediate
if (funct3 == 0x00) { // LB
2024-12-06 21:58:16 +00:00
uint32_t addr = registers[rs1] + imm;
if (addr + 1 > memory_size) {
throw std::runtime_error("Memory access out of bounds");
}
registers[rd] = 0;
2024-12-06 21:58:16 +00:00
std::memcpy(&registers[rd], memory + addr, sizeof(uint8_t));
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x01) { // LH
2024-12-06 21:58:16 +00:00
uint32_t addr = registers[rs1] + imm;
if (addr + 2 > memory_size) {
throw std::runtime_error("Memory access out of bounds");
}
registers[rd] = 0;
2024-12-06 21:58:16 +00:00
std::memcpy(&registers[rd], memory + addr, sizeof(uint16_t));
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x2) { // LW
2024-12-06 21:58:16 +00:00
uint32_t addr = registers[rs1] + imm;
if (addr + 4 > memory_size) {
throw std::runtime_error("Memory access out of bounds");
}
std::memcpy(&registers[rd], memory + addr, sizeof(uint32_t));
} else {
throw std::runtime_error("Unknown load instruction");
}
break;
}
2024-12-09 20:17:21 +00:00
case 0x23: { // S-type (SW)
imm = ((instr >> 7) & 0x1F) | (((instr >> 25) & 0x7F) << 5);
2024-12-09 20:17:21 +00:00
imm = sign_extend(imm, 12); // Sign-extend 12-bit immediate
if (funct3 == 0x0) { // SB
2024-12-06 21:58:16 +00:00
uint32_t addr = registers[rs1] + imm;
if (addr + 1 > memory_size) {
throw std::runtime_error("Memory access out of bounds");
}
std::memcpy(memory + addr, &registers[rs2], sizeof(uint8_t));
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x1) { // SH
2024-12-06 21:58:16 +00:00
uint32_t addr = registers[rs1] + imm;
if (addr + 2 > memory_size) {
throw std::runtime_error("Memory access out of bounds");
}
std::memcpy(memory + addr, &registers[rs2], sizeof(uint16_t));
2024-12-09 20:17:21 +00:00
} else if (funct3 == 0x2) { // SW
2024-12-06 21:58:16 +00:00
uint32_t addr = registers[rs1] + imm;
if (addr + 4 > memory_size) {
throw std::runtime_error("Memory access out of bounds");
}
std::memcpy(memory + addr, &registers[rs2], sizeof(uint32_t));
} else {
throw std::runtime_error("Unknown store instruction");
}
break;
}
2024-12-09 20:17:21 +00:00
case 0x6F: { // JAL
int32_t offset =
((instr & 0x80000000) ? 0xFFF00000
: 0) | // Sign-extension for imm[20]
((instr >> 21) & 0x3FF) << 1 | // imm[10:1]
((instr >> 20) & 0x1) << 11 | // imm[11]
((instr & 0xFF000)); // imm[19:12]
2024-12-06 21:58:16 +00:00
2024-12-09 20:17:21 +00:00
registers[rd] = pc; // Save return address
2024-12-06 21:58:16 +00:00
pc += offset - 4;
break;
}
2024-12-09 20:17:21 +00:00
case 0x67: { // JALR
int32_t offset = (instr >> 20); // Sign-extended 12-bit immediate
uint32_t target =
(registers[rs1] + offset) & ~1; // Target address (LSB cleared)
2024-12-06 21:58:16 +00:00
2024-12-09 20:17:21 +00:00
registers[rd] = pc; // Save return address
pc = target;
2024-12-06 21:58:16 +00:00
break;
}
2024-12-09 20:17:21 +00:00
case 0x37: { // LUI
uint32_t imm = (instr >> 12) & 0xFFFFF; // Extract 20-bit immediate
registers[rd] =
imm
<< 12; // Shift the immediate to the upper 20 bits of the register
2024-12-06 21:58:16 +00:00
break;
}
2024-12-09 20:17:21 +00:00
case 0x17: { // AUIPC
uint32_t imm = (instr >> 12) & 0xFFFFF; // Extract 20-bit immediate
registers[rd] =
pc +
(imm << 12); // Add the immediate (shifted left) to the current PC
2024-12-06 21:58:16 +00:00
break;
}
2024-12-09 21:21:47 +00:00
case 0x73: { // EBREAK
pc -= 4;
throw EbreakException();
2024-12-06 23:50:21 +00:00
break;
}
2024-12-06 21:58:16 +00:00
default:
throw std::runtime_error("Unknown opcode");
2024-12-09 20:17:21 +00:00
}
}
void VM::eval() {
2024-12-09 21:21:47 +00:00
while (true) {
2024-12-09 20:17:21 +00:00
step();
2024-12-06 21:58:16 +00:00
}
}