Skip to content

Commit

Permalink
[wip] migrate T1 to FixedIOModule
Browse files Browse the repository at this point in the history
  • Loading branch information
sequencer committed Jul 20, 2024
1 parent b4f6d25 commit f89a4d4
Show file tree
Hide file tree
Showing 2 changed files with 269 additions and 216 deletions.
335 changes: 187 additions & 148 deletions ipemu/src/TestBench.scala
Original file line number Diff line number Diff line change
Expand Up @@ -23,16 +23,21 @@ class TestBenchOM extends Class {
t1 := t1In
}

class TestBench(generator: SerializableModuleGenerator[T1, T1Parameter]) extends RawModule {
class TestBench(generator: SerializableModuleGenerator[T1, T1Parameter])
extends RawModule
with ImplicitClock
with ImplicitReset {
val omInstance: Instance[TestBenchOM] = Instantiate(new TestBenchOM)
val omType: ClassType = omInstance.toDefinition.getClassType
val omType: ClassType = omInstance.toDefinition.getClassType
@public
val om: Property[ClassType] = IO(Output(Property[omType.Type]()))
om := omInstance.getPropertyReference

val clockGen = Module(new ExtModule with HasExtModuleInline {
lazy val clockGen = Module(new ExtModule with HasExtModuleInline {

override def desiredName = "ClockGen"
setInline(s"$desiredName.sv",
setInline(
s"$desiredName.sv",
s"""module $desiredName(output reg clock, output reg reset);
| export "DPI-C" function dump_wave;
| function dump_wave(input string file);
Expand All @@ -54,186 +59,220 @@ class TestBench(generator: SerializableModuleGenerator[T1, T1Parameter]) extends
val clock = IO(Output(Bool()))
val reset = IO(Output(Bool()))
})
def clock = clockGen.clock.asClock
def reset = clockGen.reset
override def implicitClock = clockGen.clock.asClock
override def implicitReset = clockGen.reset
val dut: Instance[T1] = generator.instance()

val clock: Clock = clockGen.clock.asClock
val reset: Bool = clockGen.reset
val simulationTime: UInt = withClockAndReset(clock, reset)(RegInit(0.U(64.W)))
val simulationTime: UInt = RegInit(0.U(64.W))
simulationTime := simulationTime + 1.U

val dut: T1 = withClockAndReset(clock, reset)(Module(generator.module()))
omInstance.t1In := Property(dut.om.asAnyClassType)
dut.io.clock := clockGen.clock.asClock
dut.io.reset := clockGen.reset
omInstance.t1In := Property(dut.io.om.asAnyClassType)
// Instruction Drivers
withClockAndReset(clock, reset) {

// TODO: this way of initializing (via initFlag) cannot take effect before reset...
val initFlag = RegInit(false.B)
when(!initFlag) {
initFlag := true.B
printf(cf"""{"event":"SimulationStart","cycle":${simulationTime}}\n""")
}
val watchdog = RawUnclockedNonVoidFunctionCall("cosim_watchdog", UInt(8.W))(simulationTime(9, 0) === 0.U)
when(watchdog =/= 0.U) {
stop(cf"""{"event":"SimulationStop","reason": ${watchdog},"cycle":${simulationTime}}\n""")
}
// TODO: this way of initializing (via initFlag) cannot take effect before reset...
val initFlag = RegInit(false.B)
when(!initFlag) {
initFlag := true.B
printf(cf"""{"event":"SimulationStart","cycle":${simulationTime}}\n""")
}
val watchdog = RawUnclockedNonVoidFunctionCall("cosim_watchdog", UInt(8.W))(simulationTime(9, 0) === 0.U)
when(watchdog =/= 0.U) {
stop(cf"""{"event":"SimulationStop","reason": ${watchdog},"cycle":${simulationTime}}\n""")
}

// Payload type returned by the "issue_vector_instruction" function call; every field is a 32-bit UInt.
// uint32_t -> svBitVecVal -> reference type with 7 length.
// NOTE(review): this bundle declares eight 32-bit fields, not seven — confirm the length above against the DPI side.
class Issue extends Bundle {
// Forwarded unchanged to the DUT request as `instruction`.
val instruction: UInt = UInt(32.W)
// Forwarded unchanged to the DUT request as `src1Data`.
val src1Data: UInt = UInt(32.W)
// Forwarded unchanged to the DUT request as `src2Data`.
val src2Data: UInt = UInt(32.W)
// mstatus, vstatus?
// The testbench slices vtype as: [2:0] -> vlmul, [5:3] -> vSew, [6] -> vta, [7] -> vma.
val vtype: UInt = UInt(32.W)
// Drives csrInterface.vl.
val vl: UInt = UInt(32.W)
// vlenb
// Drives csrInterface.vStart.
val vstart: UInt = UInt(32.W)
// vxrm, vxsat are merged to vcsr
// Only bits [2:1] are consumed by the testbench (as vxrm).
val vcsr: UInt = UInt(32.W)
// meta is used to control the simulation.
// 0 is reserved, i.e. not valid: request.valid stays low
// 1 is normal: a valid instruction; the only value that asserts request.valid
// 2 is fence: request.valid stays low and the testbench `fence` register is set, which
//   blocks further issue until a response is valid or no instruction is outstanding
// others are exit: the testbench calls stop() and ends the simulation immediately
val meta: UInt = UInt(32.W)
}
// Payload passed to the "retire_vector_instruction" function call, which the testbench
// enables with the DUT's response.valid. Every field is a 32-bit UInt.
class Retire extends Bundle {
// Driven from response.bits.rd.bits.
val rd: UInt = UInt(32.W)
// Driven from response.bits.data.
val data: UInt = UInt(32.W)
// Driven from response.bits.rd.valid (a single-bit flag carried in a 32-bit field).
val writeRd: UInt = UInt(32.W)
// Driven from response.bits.vxsat.
val vxsat: UInt = UInt(32.W)
}
val issue = WireDefault(0.U.asTypeOf(new Issue))
val fence = RegInit(false.B)
val outstanding = RegInit(0.U(4.W))
val doIssue: Bool = dut.request.ready && !fence
outstanding := outstanding + (doIssue && (issue.meta === 1.U)) - dut.response.valid
fence := Mux(doIssue, issue.meta === 2.U, fence && !dut.response.valid && !(outstanding === 0.U))

issue := RawClockedNonVoidFunctionCall("issue_vector_instruction", new Issue)(
clock,
doIssue,
)
dut.request.bits.instruction := issue.instruction
dut.request.bits.src1Data := issue.src1Data
dut.request.bits.src2Data := issue.src2Data
dut.csrInterface.vlmul := issue.vtype(2, 0)
dut.csrInterface.vSew := issue.vtype(5, 3)
dut.csrInterface.vta := issue.vtype(6)
dut.csrInterface.vma := issue.vtype(7)
dut.csrInterface.vl := issue.vl
dut.csrInterface.vStart := issue.vstart
dut.csrInterface.vxrm := issue.vcsr(2, 1)

dut.csrInterface.ignoreException := 0.U
dut.storeBufferClear := true.B
dut.request.valid := issue.meta === 1.U
when(issue.meta =/= 0.U && issue.meta =/= 1.U && issue.meta =/= 2.U) {
stop(cf"""{"event":"SimulationStop","reason": ${issue.meta},"cycle":${simulationTime}}\n""")
}
val retire = Wire(new Retire)
retire.rd := dut.response.bits.rd.bits
retire.data := dut.response.bits.data
retire.writeRd := dut.response.bits.rd.valid
retire.vxsat := dut.response.bits.vxsat
RawClockedVoidFunctionCall("retire_vector_instruction")(clock, dut.response.valid, retire)
val dummy = Wire(Bool())
dummy := false.B
RawClockedVoidFunctionCall("retire_vector_mem")(clock, dut.response.bits.mem && dut.response.valid, dummy)
// Payload type returned by the "issue_vector_instruction" function call; every field is a 32-bit UInt.
// uint32_t -> svBitVecVal -> reference type with 7 length.
// NOTE(review): this bundle declares eight 32-bit fields, not seven — confirm the length above against the DPI side.
class Issue extends Bundle {
// Forwarded unchanged to the DUT request as `instruction`.
val instruction: UInt = UInt(32.W)
// Forwarded unchanged to the DUT request as `src1Data`.
val src1Data: UInt = UInt(32.W)
// Forwarded unchanged to the DUT request as `src2Data`.
val src2Data: UInt = UInt(32.W)
// mstatus, vstatus?
// The testbench slices vtype as: [2:0] -> vlmul, [5:3] -> vSew, [6] -> vta, [7] -> vma.
val vtype: UInt = UInt(32.W)
// Drives csrInterface.vl.
val vl: UInt = UInt(32.W)
// vlenb
// Drives csrInterface.vStart.
val vstart: UInt = UInt(32.W)
// vxrm, vxsat are merged to vcsr
// Only bits [2:1] are consumed by the testbench (as vxrm).
val vcsr: UInt = UInt(32.W)
// meta is used to control the simulation.
// 0 is reserved, i.e. not valid: request.valid stays low
// 1 is normal: a valid instruction; the only value that asserts request.valid
// 2 is fence: request.valid stays low and the testbench `fence` register is set, which
//   blocks further issue until a response is valid or no instruction is outstanding
// others are exit: the testbench calls stop() and ends the simulation immediately
val meta: UInt = UInt(32.W)
}
// Payload passed to the "retire_vector_instruction" function call, which the testbench
// enables with the DUT's response.valid. Every field is a 32-bit UInt.
class Retire extends Bundle {
// Driven from response.bits.rd.bits.
val rd: UInt = UInt(32.W)
// Driven from response.bits.data.
val data: UInt = UInt(32.W)
// Driven from response.bits.rd.valid (a single-bit flag carried in a 32-bit field).
val writeRd: UInt = UInt(32.W)
// Driven from response.bits.vxsat.
val vxsat: UInt = UInt(32.W)
}
val issue = WireDefault(0.U.asTypeOf(new Issue))
val fence = RegInit(false.B)
val outstanding = RegInit(0.U(4.W))
val doIssue: Bool = dut.io.request.ready && !fence
outstanding := outstanding + (doIssue && (issue.meta === 1.U)) - dut.io.response.valid
fence := Mux(doIssue, issue.meta === 2.U, fence && !dut.io.response.valid && !(outstanding === 0.U))

issue := RawClockedNonVoidFunctionCall("issue_vector_instruction", new Issue)(
clock,
doIssue
)
dut.io.request.bits.instruction := issue.instruction
dut.io.request.bits.src1Data := issue.src1Data
dut.io.request.bits.src2Data := issue.src2Data
dut.io.csrInterface.vlmul := issue.vtype(2, 0)
dut.io.csrInterface.vSew := issue.vtype(5, 3)
dut.io.csrInterface.vta := issue.vtype(6)
dut.io.csrInterface.vma := issue.vtype(7)
dut.io.csrInterface.vl := issue.vl
dut.io.csrInterface.vStart := issue.vstart
dut.io.csrInterface.vxrm := issue.vcsr(2, 1)

dut.io.csrInterface.ignoreException := 0.U
dut.io.storeBufferClear := true.B
dut.io.request.valid := issue.meta === 1.U
when(issue.meta =/= 0.U && issue.meta =/= 1.U && issue.meta =/= 2.U) {
stop(cf"""{"event":"SimulationStop","reason": ${issue.meta},"cycle":${simulationTime}}\n""")
}
val retire = Wire(new Retire)
retire.rd := dut.io.response.bits.rd.bits
retire.data := dut.io.response.bits.data
retire.writeRd := dut.io.response.bits.rd.valid
retire.vxsat := dut.io.response.bits.vxsat
RawClockedVoidFunctionCall("retire_vector_instruction")(clock, dut.io.response.valid, retire)
val dummy = Wire(Bool())
dummy := false.B
RawClockedVoidFunctionCall("retire_vector_mem")(clock, dut.io.response.bits.mem && dut.io.response.valid, dummy)

// Memory Drivers
Seq(
dut.highBandwidthLoadStorePort,
dut.indexedLoadStorePort
).map(_.viewAs[AXI4RWIrrevocableVerilog]).lazyZip(
Seq("highBandwidthPort", "indexedAccessPort")
).zipWithIndex.foreach {
case ((bundle: AXI4RWIrrevocableVerilog, channelName: String), index: Int) =>
val agent = Module(new AXI4SlaveAgent(
AXI4SlaveAgentParameter(
name= channelName,
axiParameter = bundle.parameter,
outstanding = 4,
readPayloadSize = 1,
writePayloadSize = 1,
)
)).suggestName(s"axi4_channel${index}_${channelName}")
agent.io.channel match {
case io: AXI4RWIrrevocableVerilog => io <> bundle
}
agent.io.clock := clock
agent.io.reset := reset
agent.io.channelId := index.U
agent.io.gateRead := false.B
agent.io.gateWrite := false.B
}
dut.io.highBandwidthLoadStorePort,
dut.io.indexedLoadStorePort
).map(_.viewAs[AXI4RWIrrevocableVerilog])
.lazyZip(
Seq("highBandwidthPort", "indexedAccessPort")
)
.zipWithIndex
.foreach {
case ((bundle: AXI4RWIrrevocableVerilog, channelName: String), index: Int) =>
val agent = Module(
new AXI4SlaveAgent(
AXI4SlaveAgentParameter(
name = channelName,
axiParameter = bundle.parameter,
outstanding = 4,
readPayloadSize = 1,
writePayloadSize = 1
)
)
).suggestName(s"axi4_channel${index}_${channelName}")
agent.io.channel match {
case io: AXI4RWIrrevocableVerilog => io <> bundle
}
agent.io.clock := clock
agent.io.reset := reset
agent.io.channelId := index.U
agent.io.gateRead := false.B
agent.io.gateWrite := false.B
}

// Events for difftest and performance modeling

val laneProbes = dut.laneProbes.zipWithIndex.map{case (p, idx) =>
val wire = Wire(p.cloneType).suggestName(s"lane${idx}Probe")
wire := probe.read(p)
wire
val laneProbes = dut.io.laneProbes.zipWithIndex.map {
case (p, idx) =>
val wire = Wire(p.cloneType).suggestName(s"lane${idx}Probe")
wire := probe.read(p)
wire
}

val lsuProbe = probe.read(dut.lsuProbe).suggestName("lsuProbe")
val lsuProbe = probe.read(dut.io.lsuProbe).suggestName("lsuProbe")

val storeUnitProbe = lsuProbe.storeUnitProbe.suggestName("storeUnitProbe")

val otherUnitProbe = lsuProbe.otherUnitProbe.suggestName("otherUnitProbe")

val laneVrfProbes = dut.laneVrfProbes.zipWithIndex.map{ case (p, idx) =>
val wire = Wire(p.cloneType).suggestName(s"lane${idx}VrfProbe")
wire := probe.read(p)
wire
val laneVrfProbes = dut.io.laneVrfProbes.zipWithIndex.map {
case (p, idx) =>
val wire = Wire(p.cloneType).suggestName(s"lane${idx}VrfProbe")
wire := probe.read(p)
wire
}

val t1Probe = probe.read(dut.io.t1Probe)

// vrf write
laneVrfProbes.zipWithIndex.foreach {
case (lane, i) =>
when(lane.valid)(
printf(
cf"""{"event":"VrfWrite","issue_idx":${lane.requestInstruction},"vd":${lane.requestVd},"offset":${lane.requestOffset},"mask":"${lane.requestMask}%x","data":"${lane.requestData}%x","lane":$i,"cycle":${simulationTime}}\n"""
)
)
}
// memory write from store unit
when(storeUnitProbe.valid)(
printf(
cf"""{"event":"MemoryWrite","lsu_idx":${storeUnitProbe.index},"mask":"${storeUnitProbe.mask}%x","data":"${storeUnitProbe.data}%x","address":"${storeUnitProbe.address}%x","cycle":${simulationTime}}\n"""
)
)
// memory write from other unit
when(otherUnitProbe.valid)(
printf(
cf"""{"event":"MemoryWrite","lsu_idx":${otherUnitProbe.index},"mask":"${otherUnitProbe.mask}%x","data":"${otherUnitProbe.data}%x","address":"${otherUnitProbe.address}%x","cycle":${simulationTime}}\n"""
)
)
// issue
when(dut.io.request.fire)(
printf(cf"""{"event":"Issue","idx":${t1Probe.instructionCounter},"cycle":${simulationTime}}\n""")
)
// check rd
when(dut.io.response.bits.rd.valid)(
printf(
cf"""{"event":"CheckRd","data":"${dut.io.response.bits.data}%x","issue_idx":${t1Probe.responseCounter},"cycle":${simulationTime}}\n"""
)
)
// lsu enq
when(lsuProbe.reqEnq.orR)(printf(cf"""{"event":"LsuEnq","enq":${lsuProbe.reqEnq},"cycle":${simulationTime}}\n"""))

val t1Probe = probe.read(dut.t1Probe)

withClockAndReset(clock, reset) {
// vrf write
laneVrfProbes.zipWithIndex.foreach { case (lane, i) => when(lane.valid)(printf(cf"""{"event":"VrfWrite","issue_idx":${lane.requestInstruction},"vd":${lane.requestVd},"offset":${lane.requestOffset},"mask":"${lane.requestMask}%x","data":"${lane.requestData}%x","lane":$i,"cycle":${simulationTime}}\n""")) }
// memory write from store unit
when(storeUnitProbe.valid)(printf(cf"""{"event":"MemoryWrite","lsu_idx":${storeUnitProbe.index},"mask":"${storeUnitProbe.mask}%x","data":"${storeUnitProbe.data}%x","address":"${storeUnitProbe.address}%x","cycle":${simulationTime}}\n"""))
// memory write from other unit
when(otherUnitProbe.valid)(printf(cf"""{"event":"MemoryWrite","lsu_idx":${otherUnitProbe.index},"mask":"${otherUnitProbe.mask}%x","data":"${otherUnitProbe.data}%x","address":"${otherUnitProbe.address}%x","cycle":${simulationTime}}\n"""))
// issue
when(dut.request.fire)(printf(cf"""{"event":"Issue","idx":${t1Probe.instructionCounter},"cycle":${simulationTime}}\n"""))
// check rd
when(dut.response.bits.rd.valid)(printf(cf"""{"event":"CheckRd","data":"${dut.response.bits.data}%x","issue_idx":${t1Probe.responseCounter},"cycle":${simulationTime}}\n"""))
// lsu enq
when(lsuProbe.reqEnq.orR)(printf(cf"""{"event":"LsuEnq","enq":${lsuProbe.reqEnq},"cycle":${simulationTime}}\n"""))

// allocate 2 * chainingSize scoreboards
val vrfWriteScoreboard: Seq[Valid[UInt]] = Seq.tabulate(2 * dut.parameter.chainingSize) { _ => RegInit(0.U.asTypeOf(Valid(UInt(16.W))))}
vrfWriteScoreboard.foreach(scoreboard => dontTouch(scoreboard))
val instructionValid =
(laneProbes.map(laneProbe => laneProbe.instructionValid ## laneProbe.instructionValid) :+
lsuProbe.lsuInstructionValid :+ t1Probe.instructionValid).reduce(_ | _)
val scoreboardEnq = Mux(t1Probe.instructionIssue, UIntToOH(t1Probe.issueTag), 0.U((2 * dut.parameter.chainingSize).W))
vrfWriteScoreboard.zipWithIndex.foreach { case (scoreboard, tag) =>
// allocate 2 * chainingSize scoreboards
val vrfWriteScoreboard: Seq[Valid[UInt]] = Seq.tabulate(2 * generator.parameter.chainingSize) { _ =>
RegInit(0.U.asTypeOf(Valid(UInt(16.W))))
}
vrfWriteScoreboard.foreach(scoreboard => dontTouch(scoreboard))
val instructionValid =
(laneProbes.map(laneProbe => laneProbe.instructionValid ## laneProbe.instructionValid) :+
lsuProbe.lsuInstructionValid :+ t1Probe.instructionValid).reduce(_ | _)
val scoreboardEnq =
Mux(t1Probe.instructionIssue, UIntToOH(t1Probe.issueTag), 0.U((2 * generator.parameter.chainingSize).W))
vrfWriteScoreboard.zipWithIndex.foreach {
case (scoreboard, tag) =>
val writeEnq: UInt = VecInit(
// vrf write from lane
laneProbes.flatMap(laneProbe => laneProbe.slots.map(slot =>
slot.writeTag === tag.U && slot.writeQueueEnq && slot.writeMask.orR
)) ++ laneProbes.flatMap(laneProbe => laneProbe.crossWriteProbe.map(cp =>
cp.bits.writeTag === tag.U && cp.valid && cp.bits.writeMask.orR
)) ++
laneProbes.flatMap(laneProbe =>
laneProbe.slots.map(slot => slot.writeTag === tag.U && slot.writeQueueEnq && slot.writeMask.orR)
) ++ laneProbes.flatMap(laneProbe =>
laneProbe.crossWriteProbe.map(cp => cp.bits.writeTag === tag.U && cp.valid && cp.bits.writeMask.orR)
) ++
// vrf write from lsu
lsuProbe.slots.map(slot => slot.dataInstruction === tag.U && slot.writeValid && slot.dataMask.orR) ++
// vrf write from Sequencer
Some(t1Probe.writeQueueEnq.bits === tag.U && t1Probe.writeQueueEnq.valid && t1Probe.writeQueueEnqMask.orR)
).asUInt
).asUInt
// always equal to array index
scoreboard.bits := scoreboard.bits + PopCount(writeEnq)
when(scoreboard.valid && !instructionValid(tag)){
printf(cf"""{"event":"VrfScoreboardReport","count":${scoreboard.bits},"issue_idx":${tag},"cycle":${simulationTime}}\n""")
when(scoreboard.valid && !instructionValid(tag)) {
printf(
cf"""{"event":"VrfScoreboardReport","count":${scoreboard.bits},"issue_idx":${tag},"cycle":${simulationTime}}\n"""
)
scoreboard.valid := false.B
}
when(scoreboardEnq(tag)) {
scoreboard.valid := true.B
assert(!scoreboard.valid)
scoreboard.bits := 0.U
}
}
}
}
Loading

0 comments on commit f89a4d4

Please sign in to comment.