resource-optimised-DCT/riscv_hw.py

177 lines
4.3 KiB
Python

import m5
from m5.objects import System, SrcClockDomain, VoltageDomain, Root, \
RiscvO3CPU, Cache, AddrRange, SEWorkload, Process, MemCtrl, \
DDR3_1600_8x8, SystemXBar, L2XBar, RiscvISA
class RiscvHWConfig:
def __init__(self, l1i, l1d, l2, vlen, elen, cores):
self.l1i = l1i
self.l1d = l1d
self.l2 = l2
self.vlen = vlen
self.elen = elen
self.cores = cores
def get_config():
import argparse
parser = argparse.ArgumentParser()
parser.add_argument('--l1i', type=str, default='16kB')
parser.add_argument('--l1d', type=str, default='64kB')
parser.add_argument('--l2', type=str, default='256kB')
parser.add_argument('--vlen', type=int, default=256)
parser.add_argument('--elen', type=int, default=64)
parser.add_argument('--cores', type=int, default=1)
args = parser.parse_args()
return RiscvHWConfig(args.l1i, args.l1d, args.l2,
args.vlen, args.elen, args.cores)
class L1Cache(Cache):
assoc = 2
tag_latency = 2
data_latency = 2
response_latency = 2
mshrs = 4
tgts_per_mshr = 20
def __init__(self, config=None):
super().__init__()
pass
def connectCPU(self, cpu):
raise NotImplementedError
def connectBus(self, bus):
self.mem_side = bus.cpu_side_ports
class L1ICache(L1Cache):
size = '16kB'
def __init__(self, config=None):
super().__init__(config)
if not config or not config.l1i:
return
self.size = config.l1i
def connectCPU(self, cpu):
self.cpu_side = cpu.icache_port
class L1DCache(L1Cache):
size = '64kB'
def __init__(self, config=None):
super().__init__(config)
if not config or not config.l1d:
return
self.size = config.l1d
def connectCPU(self, cpu):
self.cpu_side = cpu.dcache_port
class L2Cache(Cache):
size = '256kB'
assoc = 8
tag_latency = 20
data_latency = 20
response_latency = 20
mshrs = 20
tgts_per_mshr = 12
def __init__(self, config=None):
super().__init__()
if not config or not config.l2:
return
self.size = config.l2
def connectCPUSideBus(self, bus):
self.cpu_side = bus.mem_side_ports
def connectMemSideBus(self, bus):
self.mem_side = bus.cpu_side_ports
def createCPU(l2bus, config):
cpu = RiscvO3CPU()
cpu.isa = RiscvISA(enable_rvv=True, vlen=config.vlen, elen=config.elen)
cpu.icache = L1ICache(config)
cpu.dcache = L1DCache(config)
cpu.icache.connectCPU(cpu)
cpu.dcache.connectCPU(cpu)
cpu.icache.connectBus(l2bus)
cpu.dcache.connectBus(l2bus)
cpu.createInterruptController()
return cpu
config = get_config()
print(f"l1i size: {config.l1i}")
print(f"l1d size: {config.l1d}")
print(f"l2 size: {config.l2}")
print(f"vlen size: {config.vlen} bits")
print(f"elen size: {config.elen} bits")
print(f"cores: {config.cores}")
print("\n")
assert config.vlen >= 2 * config.elen, \
"ERROR: vlen must be at least twice as large as elen"
assert 128 <= config.vlen <= 4096, \
"ERROR: vlen must be between 128 and 4096 bits"
assert config.vlen & (config.vlen - 1) == 0, \
"ERROR: vlen must be a power of 2"
assert config.elen in [16, 32, 64], \
"ERROR: elen must be 16, 32 or 64"
system = System()
system.clk_domain = SrcClockDomain()
system.clk_domain.clock = '1GHz'
system.clk_domain.voltage_domain = VoltageDomain()
system.mem_mode = 'timing'
system.mem_ranges = [AddrRange('512MB')]
system.l2bus = L2XBar()
system.cpu = [createCPU(system.l2bus, config) for _ in range(config.cores)]
system.l2cache = L2Cache(config)
system.l2cache.connectCPUSideBus(system.l2bus)
system.membus = SystemXBar()
system.l2cache.connectMemSideBus(system.membus)
system.mem_ctrl = MemCtrl()
system.mem_ctrl.dram = DDR3_1600_8x8()
system.mem_ctrl.dram.range = system.mem_ranges[0]
system.mem_ctrl.port = system.membus.mem_side_ports
binary = './dct2d_riscv.out'
system.workload = SEWorkload.init_compatible(binary)
process = Process()
process.cmd = [binary]
for cpu in system.cpu:
cpu.workload = process
cpu.createThreads()
# Run SE mode
root = Root(full_system=False, system=system)
m5.instantiate()
print("Beginning simulation!")
exit_event = m5.simulate()
print(f"Exiting @ tick {m5.curTick()} because {exit_event.getCause()}")