#include "simulator.h" #include #include #include #define ENABLE_DRAM_STALLS #define DRAM_LATENCY 24 #define DRAM_RQ_SIZE 16 #define DRAM_STALLS_MODULO 16 #define VL_WDATA_GETW(lwp, i, n, w) \ VL_SEL_IWII(0, n * w, 0, 0, lwp, i * w, w) uint64_t timestamp = 0; double sc_time_stamp() { return timestamp; } Simulator::Simulator() { // force random values for unitialized signals Verilated::randReset(2); Verilated::randSeed(50); // Turn off assertion before reset Verilated::assertOn(false); ram_ = nullptr; vortex_ = new VVortex(); #ifdef VCD_OUTPUT Verilated::traceEverOn(true); trace_ = new VerilatedVcdC(); vortex_->trace(trace_, 99); trace_->open("trace.vcd"); #endif // reset the device this->reset(); } Simulator::~Simulator() { for (auto& buf : print_bufs_) { auto str = buf.second.str(); if (str.size()) { std::cout << "#" << buf.first << ": " << buf.second.str() << std::endl; } } #ifdef VCD_OUTPUT trace_->close(); #endif delete vortex_; } void Simulator::attach_ram(RAM* ram) { ram_ = ram; dram_rsp_vec_.clear(); } void Simulator::reset() { print_bufs_.clear(); dram_rsp_vec_.clear(); dram_rsp_active_ = false; snp_req_active_ = false; csr_req_active_ = false; snp_req_size_ = 0; pending_snp_reqs_ = 0; csr_rsp_value_ = nullptr; vortex_->dram_rsp_valid = 0; vortex_->dram_req_ready = 0; vortex_->io_req_ready = 0; vortex_->io_rsp_valid = 0; vortex_->snp_req_valid = 0; vortex_->snp_rsp_ready = 0; vortex_->csr_io_req_valid = 0; vortex_->csr_io_rsp_ready = 0; vortex_->reset = 1; vortex_->clk = 0; this->eval(); vortex_->clk = 1; this->eval(); vortex_->reset = 0; // Turn on assertion after reset Verilated::assertOn(true); } void Simulator::step() { vortex_->clk = 0; this->eval(); dram_rsp_ready_ = vortex_->dram_rsp_ready; snp_req_ready_ = vortex_->snp_req_ready; csr_io_req_ready_ = vortex_->csr_io_req_ready; vortex_->clk = 1; this->eval(); this->eval_dram_bus(); this->eval_io_bus(); this->eval_csr_bus(); this->eval_snp_bus(); #ifndef NDEBUG fflush(stdout); #endif } void Simulator::eval() { vortex_->eval(); #ifdef VCD_OUTPUT trace_->dump(timestamp); #endif ++timestamp; } void Simulator::eval_dram_bus() { if (ram_ == nullptr) { vortex_->dram_req_ready = 0; return; } // update DRAM responses schedule for (auto& rsp : dram_rsp_vec_) { if (rsp.cycles_left > 0) rsp.cycles_left -= 1; } // schedule DRAM responses in FIFO order std::list::iterator dram_rsp_it(dram_rsp_vec_.end()); if (!dram_rsp_vec_.empty() && (0 == dram_rsp_vec_.begin()->cycles_left)) { dram_rsp_it = dram_rsp_vec_.begin(); } // send DRAM response if (dram_rsp_active_ && vortex_->dram_rsp_valid && dram_rsp_ready_) { dram_rsp_active_ = false; } if (!dram_rsp_active_) { if (dram_rsp_it != dram_rsp_vec_.end()) { vortex_->dram_rsp_valid = 1; memcpy((uint8_t*)vortex_->dram_rsp_data, dram_rsp_it->block.data(), GLOBAL_BLOCK_SIZE); vortex_->dram_rsp_tag = dram_rsp_it->tag; dram_rsp_vec_.erase(dram_rsp_it); dram_rsp_active_ = true; } else { vortex_->dram_rsp_valid = 0; } } // handle DRAM stalls bool dram_stalled = false; #ifdef ENABLE_DRAM_STALLS if (0 == ((timestamp/2) % DRAM_STALLS_MODULO)) { dram_stalled = true; } else if (dram_rsp_vec_.size() >= DRAM_RQ_SIZE) { dram_stalled = true; } #endif // process DRAM requests if (!dram_stalled) { if (vortex_->dram_req_valid) { if (vortex_->dram_req_rw) { uint64_t byteen = vortex_->dram_req_byteen; unsigned base_addr = (vortex_->dram_req_addr * GLOBAL_BLOCK_SIZE); uint8_t* data = (uint8_t*)(vortex_->dram_req_data); for (int i = 0; i < GLOBAL_BLOCK_SIZE; i++) { if ((byteen >> i) & 0x1) { (*ram_)[base_addr + i] = data[i]; } } } else { dram_req_t dram_req; dram_req.tag = vortex_->dram_req_tag; dram_req.addr = vortex_->dram_req_addr; ram_->read(vortex_->dram_req_addr * GLOBAL_BLOCK_SIZE, GLOBAL_BLOCK_SIZE, dram_req.block.data()); dram_req.cycles_left = DRAM_LATENCY; for (auto& rsp : dram_rsp_vec_) { if (dram_req.addr == rsp.addr) { dram_req.cycles_left = rsp.cycles_left; break; } } dram_rsp_vec_.emplace_back(dram_req); } } } vortex_->dram_req_ready = !dram_stalled; } void Simulator::eval_io_bus() { for (int i = 0; i < NUM_THREADS; ++i) { if (((vortex_->io_req_valid >> i) & 0x1) && ((VL_WDATA_GETW(vortex_->io_req_addr, i, NUM_THREADS, 30) << 2) == IO_BUS_ADDR_COUT)) { assert(vortex_->io_req_rw); int data = vortex_->io_req_data[i]; int tid = data >> 16; char c = data & 0xff; auto& ss_buf = print_bufs_[tid]; ss_buf << c; if (c == '\n') { std::cout << std::dec << "#" << tid << ": " << ss_buf.str() << std::flush; ss_buf.str(""); } } } vortex_->io_req_ready = 1; vortex_->io_rsp_valid = 0; } void Simulator::eval_snp_bus() { if (snp_req_active_) { if (vortex_->snp_req_valid && snp_req_ready_) { assert(snp_req_size_); #ifdef DBG_PRINT_CACHE_SNP std::cout << std::dec << timestamp << ": [sim] SNP Req: addr=" << std::hex << vortex_->snp_req_addr << " tag=" << vortex_->snp_req_tag << " remain=" << (snp_req_size_-1) << std::endl; #endif ++vortex_->snp_req_addr; ++vortex_->snp_req_tag; ++pending_snp_reqs_; --snp_req_size_; if (0 == snp_req_size_) { vortex_->snp_req_valid = false; } } if (vortex_->snp_rsp_valid && vortex_->snp_rsp_ready) { assert(pending_snp_reqs_ > 0); --pending_snp_reqs_; if (!vortex_->snp_req_valid && 0 == pending_snp_reqs_) { vortex_->snp_rsp_ready = false; snp_req_active_ = false; } #ifdef DBG_PRINT_CACHE_SNP std::cout << std::dec << timestamp << ": [sim] SNP Rsp: tag=" << std::hex << vortex_->snp_rsp_tag << " pending=" << pending_snp_reqs_ << std::endl; #endif } } else { vortex_->snp_req_valid = 0; vortex_->snp_rsp_ready = 0; } } void Simulator::eval_csr_bus() { if (csr_req_active_) { if (vortex_->csr_io_req_valid && csr_io_req_ready_) { #ifndef NDEBUG if (vortex_->csr_io_req_rw) std::cout << std::dec << timestamp << ": [sim] CSR Wr Req: core=" << (int)vortex_->csr_io_req_coreid << ", addr=" << std::hex << vortex_->csr_io_req_addr << ", value=" << vortex_->csr_io_req_data << std::endl; else std::cout << std::dec << timestamp << ": [sim] CSR Rd Req: core=" << (int)vortex_->csr_io_req_coreid << ", addr=" << std::hex << vortex_->csr_io_req_addr << std::endl; #endif vortex_->csr_io_req_valid = 0; if (vortex_->csr_io_req_rw) csr_req_active_ = false; } if (vortex_->csr_io_rsp_valid && vortex_->csr_io_rsp_ready) { *csr_rsp_value_ = vortex_->csr_io_rsp_data; vortex_->csr_io_rsp_ready = 0; csr_req_active_ = false; #ifndef NDEBUG std::cout << std::dec << timestamp << ": [sim] CSR Rsp: value=" << vortex_->csr_io_rsp_data << std::endl; #endif } } else { vortex_->csr_io_req_valid = 0; vortex_->csr_io_rsp_ready = 0; } } void Simulator::wait(uint32_t cycles) { for (int i = 0; i < cycles; ++i) { this->step(); } } bool Simulator::is_busy() const { return vortex_->busy; } bool Simulator::snp_req_active() const { return snp_req_active_; } bool Simulator::csr_req_active() const { return csr_req_active_; } void Simulator::flush_caches(uint32_t mem_addr, uint32_t size) { if (0 == size) return; assert(!vortex_->snp_rsp_valid); vortex_->snp_req_addr = mem_addr / GLOBAL_BLOCK_SIZE; vortex_->snp_req_tag = 0; vortex_->snp_req_valid = 1; vortex_->snp_rsp_ready = 1; snp_req_size_ = (size + GLOBAL_BLOCK_SIZE - 1) / GLOBAL_BLOCK_SIZE; pending_snp_reqs_ = 0; snp_req_active_ = true; } void Simulator::set_csr(int core_id, int addr, unsigned value) { vortex_->csr_io_req_valid = 1; vortex_->csr_io_req_coreid = core_id; vortex_->csr_io_req_addr = addr; vortex_->csr_io_req_rw = 1; vortex_->csr_io_req_data = value; vortex_->csr_io_rsp_ready = 0; csr_req_active_ = true; } void Simulator::get_csr(int core_id, int addr, unsigned *value) { vortex_->csr_io_req_valid = 1; vortex_->csr_io_req_coreid = core_id; vortex_->csr_io_req_addr = addr; vortex_->csr_io_req_rw = 0; vortex_->csr_io_rsp_ready = 1; csr_rsp_value_ = value; csr_req_active_ = true; } void Simulator::run() { #ifndef NDEBUG std::cout << std::dec << timestamp << ": [sim] run()" << std::endl; #endif // execute program while (vortex_->busy && !vortex_->ebreak) { this->step(); } // wait 5 cycles to flush the pipeline this->wait(5); } int Simulator::get_last_wb_value(int reg) const { return (int)vortex_->Vortex->genblk1__BRA__0__KET____DOT__cluster->genblk1__BRA__0__KET____DOT__core->pipeline->commit->writeback->last_wb_value[reg]; } void Simulator::load_bin(const char* program_file) { if (ram_ == nullptr) return; std::ifstream ifs(program_file); if (!ifs) { std::cout << "error: " << program_file << " not found" << std::endl; } ifs.seekg(0, ifs.end); auto size = ifs.tellg(); std::vector content(size); ifs.seekg(0, ifs.beg); ifs.read((char*)content.data(), size); ram_->write(STARTUP_ADDR, size, content.data()); } void Simulator::load_ihex(const char* program_file) { if (ram_ == nullptr) return; auto hti = [&](char c)->uint32_t { if (c >= 'A' && c <= 'F') return c - 'A' + 10; if (c >= 'a' && c <= 'f') return c - 'a' + 10; return c - '0'; }; auto hToI = [&](const char *c, uint32_t size)->uint32_t { uint32_t value = 0; for (uint32_t i = 0; i < size; i++) { value += hti(c[i]) << ((size - i - 1) * 4); } return value; }; std::ifstream ifs(program_file); if (!ifs) { std::cout << "error: " << program_file << " not found" << std::endl; } ifs.seekg(0, ifs.end); uint32_t size = ifs.tellg(); std::vector content(size); ifs.seekg(0, ifs.beg); ifs.read(content.data(), size); int offset = 0; char *line = content.data(); while (true) { if (line[0] == ':') { uint32_t byteCount = hToI(line + 1, 2); uint32_t nextAddr = hToI(line + 3, 4) + offset; uint32_t key = hToI(line + 7, 2); switch (key) { case 0: for (uint32_t i = 0; i < byteCount; i++) { (*ram_)[nextAddr + i] = hToI(line + 9 + i * 2, 2); } break; case 2: offset = hToI(line + 9, 4) << 4; break; case 4: offset = hToI(line + 9, 4) << 16; break; default: break; } } while (*line != '\n' && size != 0) { ++line; --size; } if (size <= 1) break; ++line; --size; } } void Simulator::print_stats(std::ostream& out) { out << std::left; out << std::setw(24) << "# of total cycles:" << std::dec << timestamp/2 << std::endl; }