2016-11-28 01:16:37 +01:00
|
|
|
// See LICENSE.Berkeley for license details.
|
|
|
|
// See LICENSE.SiFive for license details.
|
2014-09-13 03:06:41 +02:00
|
|
|
|
2013-09-13 07:34:38 +02:00
|
|
|
package rocket
|
|
|
|
|
|
|
|
import Chisel._
|
2016-09-29 01:10:32 +02:00
|
|
|
import Chisel.ImplicitConversions._
|
2016-11-18 23:05:14 +01:00
|
|
|
import config._
|
2017-01-17 03:24:08 +01:00
|
|
|
import coreplex._
|
|
|
|
import diplomacy._
|
|
|
|
import uncore.constants._
|
|
|
|
import uncore.agents._
|
|
|
|
import uncore.coherence._
|
|
|
|
import uncore.devices._
|
|
|
|
import uncore.tilelink._
|
|
|
|
import uncore.tilelink2._
|
|
|
|
import uncore.util._
|
|
|
|
import util._
|
2013-09-13 07:34:38 +02:00
|
|
|
|
2015-10-21 00:02:24 +02:00
|
|
|
case object RoccMaxTaggedMemXacts extends Field[Int]
|
|
|
|
case object RoccNMemChannels extends Field[Int]
|
2016-02-25 07:39:00 +01:00
|
|
|
case object RoccNPTWPorts extends Field[Int]
|
2017-01-17 03:24:08 +01:00
|
|
|
case object BuildRoCC extends Field[Seq[RoccParameters]]
|
|
|
|
|
|
|
|
trait CanHaveLegacyRoccs extends CanHaveSharedFPU with CanHavePTW with TileNetwork {
|
|
|
|
val module: CanHaveLegacyRoccsModule
|
|
|
|
val legacyRocc = if (p(BuildRoCC).isEmpty) None
|
|
|
|
else Some(LazyModule(new LegacyRoccComplex()(p.alter { (site, here, up) => {
|
|
|
|
case CacheBlockOffsetBits => log2Up(site(CacheBlockBytes))
|
|
|
|
case AmoAluOperandBits => site(XLen)
|
|
|
|
case RoccNMemChannels => site(BuildRoCC).map(_.nMemChannels).foldLeft(0)(_ + _)
|
|
|
|
case RoccNPTWPorts => site(BuildRoCC).map(_.nPTWPorts).foldLeft(0)(_ + _)
|
|
|
|
case TLId => "L1toL2"
|
|
|
|
case TLKey("L1toL2") =>
|
|
|
|
TileLinkParameters(
|
|
|
|
coherencePolicy = new MESICoherence(new NullRepresentation(site(NTiles))),
|
|
|
|
nManagers = site(BankedL2Config).nBanks + 1 /* MMIO */,
|
|
|
|
nCachingClients = 1,
|
|
|
|
nCachelessClients = 1,
|
|
|
|
maxClientXacts = List(
|
|
|
|
site(DCacheKey).nMSHRs + 1 /* IOMSHR */,
|
|
|
|
if (site(BuildRoCC).isEmpty) 1 else site(RoccMaxTaggedMemXacts)).max,
|
|
|
|
maxClientsPerPort = if (site(BuildRoCC).isEmpty) 1 else 2,
|
|
|
|
maxManagerXacts = 8,
|
|
|
|
dataBeats = (8 * site(CacheBlockBytes)) / site(XLen),
|
|
|
|
dataBits = site(CacheBlockBytes)*8)
|
|
|
|
}})))
|
|
|
|
|
|
|
|
// TODO for now, all legacy rocc mem ports mapped to one external node
|
|
|
|
legacyRocc foreach { lr =>
|
|
|
|
lr.masterNodes.foreach { l1backend.node := _ }
|
|
|
|
nPTWPorts += lr.nPTWPorts
|
|
|
|
nDCachePorts += lr.nRocc
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
trait CanHaveLegacyRoccsModule extends CanHaveSharedFPUModule with CanHavePTWModule with TileNetworkModule {
|
|
|
|
val outer: CanHaveLegacyRoccs
|
|
|
|
|
|
|
|
fpuOpt foreach { fpu =>
|
|
|
|
outer.legacyRocc.orElse {
|
|
|
|
fpu.io.cp_req.valid := Bool(false)
|
|
|
|
fpu.io.cp_resp.ready := Bool(false)
|
|
|
|
None
|
|
|
|
} foreach { lr =>
|
|
|
|
fpu.io.cp_req <> lr.module.io.fpu.cp_req
|
|
|
|
fpu.io.cp_resp <> lr.module.io.fpu.cp_resp
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
outer.legacyRocc foreach { lr =>
|
|
|
|
ptwPorts ++= lr.module.io.ptw
|
|
|
|
dcachePorts ++= lr.module.io.dcache
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2017-01-19 03:15:24 +01:00
|
|
|
class LegacyRoccComplex(implicit p: Parameters) extends LazyModule {
|
2017-01-17 03:24:08 +01:00
|
|
|
val buildRocc = p(BuildRoCC)
|
|
|
|
val usingRocc = !buildRocc.isEmpty
|
|
|
|
val nRocc = buildRocc.size
|
|
|
|
val nFPUPorts = buildRocc.filter(_.useFPU).size
|
|
|
|
val nMemChannels = buildRocc.map(_.nMemChannels).sum + nRocc
|
|
|
|
val nPTWPorts = buildRocc.map(_.nPTWPorts).sum
|
|
|
|
val roccOpcodes = buildRocc.map(_.opcodes)
|
|
|
|
|
2017-01-19 03:15:24 +01:00
|
|
|
val legacies = List.fill(nMemChannels) { LazyModule(new TLLegacy()(p.alterPartial({ case PAddrBits => 32 }))) }
|
2017-01-17 03:24:08 +01:00
|
|
|
val masterNodes = legacies.map(_ => TLOutputNode())
|
|
|
|
legacies.zip(masterNodes).foreach { case(l,m) => m := TLHintHandler()(l.node) }
|
|
|
|
|
2017-01-19 03:15:24 +01:00
|
|
|
lazy val module = new LazyModuleImp(this) with HasCoreParameters {
|
2017-01-17 03:24:08 +01:00
|
|
|
val io = new Bundle {
|
|
|
|
val tl = masterNodes.map(_.bundleOut)
|
|
|
|
val dcache = Vec(nRocc, new HellaCacheIO)
|
|
|
|
val fpu = new Bundle {
|
|
|
|
val cp_req = Decoupled(new FPInput())
|
|
|
|
val cp_resp = Decoupled(new FPResult()).flip
|
|
|
|
}
|
|
|
|
val ptw = Vec(nPTWPorts, new TLBPTWIO)
|
|
|
|
val core = new Bundle {
|
|
|
|
val cmd = Decoupled(new RoCCCommand).flip
|
|
|
|
val resp = Decoupled(new RoCCResponse)
|
|
|
|
val busy = Bool(OUTPUT)
|
|
|
|
val interrupt = Bool(OUTPUT)
|
|
|
|
val exception = Bool(INPUT)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
val respArb = Module(new RRArbiter(new RoCCResponse, nRocc))
|
|
|
|
io.core.resp <> respArb.io.out
|
|
|
|
|
|
|
|
val cmdRouter = Module(new RoccCommandRouter(roccOpcodes))
|
|
|
|
cmdRouter.io.in <> io.core.cmd
|
|
|
|
|
|
|
|
val roccs = buildRocc.zipWithIndex.map { case (accelParams, i) =>
|
|
|
|
val rocc = accelParams.generator(p.alterPartial({
|
|
|
|
case RoccNMemChannels => accelParams.nMemChannels
|
|
|
|
case RoccNPTWPorts => accelParams.nPTWPorts
|
|
|
|
}))
|
2017-01-19 03:15:24 +01:00
|
|
|
val dcIF = Module(new SimpleHellaCacheIF()(p.alterPartial({ case CacheName => CacheName("L1D") })))
|
2017-01-17 03:24:08 +01:00
|
|
|
rocc.io.cmd <> cmdRouter.io.out(i)
|
|
|
|
rocc.io.exception := io.core.exception
|
|
|
|
dcIF.io.requestor <> rocc.io.mem
|
|
|
|
io.dcache(i) := dcIF.io.cache
|
|
|
|
legacies(i).module.io.legacy <> rocc.io.autl
|
|
|
|
respArb.io.in(i) <> Queue(rocc.io.resp)
|
|
|
|
rocc
|
|
|
|
}
|
|
|
|
|
2017-01-19 03:15:24 +01:00
|
|
|
(nRocc until legacies.size) zip roccs.map(_.io.utl) foreach { case(i, utl) =>
|
2017-01-17 03:24:08 +01:00
|
|
|
legacies(i).module.io.legacy <> utl
|
|
|
|
}
|
|
|
|
io.core.busy := cmdRouter.io.busy || roccs.map(_.io.busy).reduce(_ || _)
|
|
|
|
io.core.interrupt := roccs.map(_.io.interrupt).reduce(_ || _)
|
|
|
|
|
|
|
|
if (usingFPU && nFPUPorts > 0) {
|
|
|
|
val fpArb = Module(new InOrderArbiter(new FPInput, new FPResult, nFPUPorts))
|
|
|
|
val fp_rocc_ios = roccs.zip(buildRocc)
|
|
|
|
.filter { case (_, params) => params.useFPU }
|
|
|
|
.map { case (rocc, _) => rocc.io }
|
|
|
|
fpArb.io.in_req <> fp_rocc_ios.map(_.fpu_req)
|
|
|
|
fp_rocc_ios.zip(fpArb.io.in_resp).foreach {
|
|
|
|
case (rocc, arb) => rocc.fpu_resp <> arb
|
|
|
|
}
|
|
|
|
io.fpu.cp_req <> fpArb.io.out_req
|
|
|
|
fpArb.io.out_resp <> io.fpu.cp_resp
|
|
|
|
} else {
|
|
|
|
io.fpu.cp_req.valid := Bool(false)
|
|
|
|
io.fpu.cp_resp.ready := Bool(false)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
case class RoccParameters(
|
|
|
|
opcodes: OpcodeSet,
|
|
|
|
generator: Parameters => RoCC,
|
|
|
|
nMemChannels: Int = 0,
|
|
|
|
nPTWPorts : Int = 0,
|
|
|
|
useFPU: Boolean = false)
|
2015-03-13 00:27:40 +01:00
|
|
|
|
2013-09-15 00:31:50 +02:00
|
|
|
class RoCCInstruction extends Bundle
|
|
|
|
{
|
|
|
|
val funct = Bits(width = 7)
|
2013-09-22 12:18:06 +02:00
|
|
|
val rs2 = Bits(width = 5)
|
|
|
|
val rs1 = Bits(width = 5)
|
2013-09-15 00:31:50 +02:00
|
|
|
val xd = Bool()
|
|
|
|
val xs1 = Bool()
|
|
|
|
val xs2 = Bool()
|
2013-09-22 12:18:06 +02:00
|
|
|
val rd = Bits(width = 5)
|
2013-09-15 00:31:50 +02:00
|
|
|
val opcode = Bits(width = 7)
|
|
|
|
}
|
|
|
|
|
2015-10-06 06:48:05 +02:00
|
|
|
class RoCCCommand(implicit p: Parameters) extends CoreBundle()(p) {
|
2013-09-15 00:31:50 +02:00
|
|
|
val inst = new RoCCInstruction
|
2015-02-02 05:04:13 +01:00
|
|
|
val rs1 = Bits(width = xLen)
|
|
|
|
val rs2 = Bits(width = xLen)
|
2016-07-19 02:40:50 +02:00
|
|
|
val status = new MStatus
|
2013-09-15 00:31:50 +02:00
|
|
|
}
|
|
|
|
|
2015-10-06 06:48:05 +02:00
|
|
|
class RoCCResponse(implicit p: Parameters) extends CoreBundle()(p) {
|
2013-09-15 00:31:50 +02:00
|
|
|
val rd = Bits(width = 5)
|
2015-02-02 05:04:13 +01:00
|
|
|
val data = Bits(width = xLen)
|
2013-09-15 00:31:50 +02:00
|
|
|
}
|
|
|
|
|
2017-01-17 03:24:08 +01:00
|
|
|
class RoCCCoreIO(implicit p: Parameters) extends CoreBundle()(p) {
|
2013-09-15 00:31:50 +02:00
|
|
|
val cmd = Decoupled(new RoCCCommand).flip
|
|
|
|
val resp = Decoupled(new RoCCResponse)
|
2016-11-30 03:49:40 +01:00
|
|
|
val mem = new HellaCacheIO
|
2014-01-29 07:13:16 +01:00
|
|
|
val busy = Bool(OUTPUT)
|
|
|
|
val interrupt = Bool(OUTPUT)
|
2017-01-17 03:24:08 +01:00
|
|
|
val exception = Bool(INPUT)
|
2016-11-30 03:49:40 +01:00
|
|
|
|
2017-01-17 03:24:08 +01:00
|
|
|
override def cloneType = new RoCCCoreIO()(p).asInstanceOf[this.type]
|
|
|
|
}
|
|
|
|
|
|
|
|
class RoCCIO(implicit p: Parameters) extends RoCCCoreIO()(p) {
|
2014-01-29 07:13:16 +01:00
|
|
|
// These should be handled differently, eventually
|
2015-12-03 01:28:23 +01:00
|
|
|
val autl = new ClientUncachedTileLinkIO
|
|
|
|
val utl = Vec(p(RoccNMemChannels), new ClientUncachedTileLinkIO)
|
2016-02-25 07:39:00 +01:00
|
|
|
val ptw = Vec(p(RoccNPTWPorts), new TLBPTWIO)
|
2015-04-02 10:30:11 +02:00
|
|
|
val fpu_req = Decoupled(new FPInput)
|
|
|
|
val fpu_resp = Decoupled(new FPResult).flip
|
2016-01-13 00:36:16 +01:00
|
|
|
|
2017-01-17 03:24:08 +01:00
|
|
|
override def cloneType = new RoCCIO()(p).asInstanceOf[this.type]
|
2013-09-15 00:31:50 +02:00
|
|
|
}
|
|
|
|
|
2015-10-06 06:48:05 +02:00
|
|
|
abstract class RoCC(implicit p: Parameters) extends CoreModule()(p) {
|
2017-01-17 03:24:08 +01:00
|
|
|
val io = new RoCCIO
|
2013-09-24 22:53:49 +02:00
|
|
|
io.mem.req.bits.phys := Bool(true) // don't perform address translation
|
2016-08-31 18:44:32 +02:00
|
|
|
io.mem.invalidate_lr := Bool(false) // don't mess with LR/SC
|
2013-09-15 00:31:50 +02:00
|
|
|
}
|
|
|
|
|
2015-10-06 06:48:05 +02:00
|
|
|
class AccumulatorExample(n: Int = 4)(implicit p: Parameters) extends RoCC()(p) {
|
2015-11-25 23:04:28 +01:00
|
|
|
val regfile = Mem(n, UInt(width = xLen))
|
|
|
|
val busy = Reg(init = Vec.fill(n){Bool(false)})
|
2013-09-15 00:31:50 +02:00
|
|
|
|
2013-09-15 07:34:53 +02:00
|
|
|
val cmd = Queue(io.cmd)
|
|
|
|
val funct = cmd.bits.inst.funct
|
2015-11-25 23:04:28 +01:00
|
|
|
val addr = cmd.bits.rs2(log2Up(n)-1,0)
|
2013-09-15 07:34:53 +02:00
|
|
|
val doWrite = funct === UInt(0)
|
|
|
|
val doRead = funct === UInt(1)
|
|
|
|
val doLoad = funct === UInt(2)
|
|
|
|
val doAccum = funct === UInt(3)
|
|
|
|
val memRespTag = io.mem.resp.bits.tag(log2Up(n)-1,0)
|
|
|
|
|
|
|
|
// datapath
|
|
|
|
val addend = cmd.bits.rs1
|
2013-09-15 00:31:50 +02:00
|
|
|
val accum = regfile(addr)
|
2013-09-15 07:34:53 +02:00
|
|
|
val wdata = Mux(doWrite, addend, accum + addend)
|
2013-09-15 00:31:50 +02:00
|
|
|
|
2013-09-15 07:34:53 +02:00
|
|
|
when (cmd.fire() && (doWrite || doAccum)) {
|
2013-09-15 00:31:50 +02:00
|
|
|
regfile(addr) := wdata
|
|
|
|
}
|
|
|
|
|
2013-09-15 07:34:53 +02:00
|
|
|
when (io.mem.resp.valid) {
|
|
|
|
regfile(memRespTag) := io.mem.resp.bits.data
|
2016-08-04 20:17:13 +02:00
|
|
|
busy(memRespTag) := Bool(false)
|
2013-09-15 07:34:53 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// control
|
|
|
|
when (io.mem.req.fire()) {
|
|
|
|
busy(addr) := Bool(true)
|
|
|
|
}
|
|
|
|
|
|
|
|
val doResp = cmd.bits.inst.xd
|
|
|
|
val stallReg = busy(addr)
|
|
|
|
val stallLoad = doLoad && !io.mem.req.ready
|
|
|
|
val stallResp = doResp && !io.resp.ready
|
|
|
|
|
2013-09-24 19:54:09 +02:00
|
|
|
cmd.ready := !stallReg && !stallLoad && !stallResp
|
2013-09-23 09:21:43 +02:00
|
|
|
// command resolved if no stalls AND not issuing a load that will need a request
|
|
|
|
|
2013-09-25 01:32:49 +02:00
|
|
|
// PROC RESPONSE INTERFACE
|
2013-09-24 19:54:09 +02:00
|
|
|
io.resp.valid := cmd.valid && doResp && !stallReg && !stallLoad
|
|
|
|
// valid response if valid command, need a response, and no stalls
|
2013-09-15 07:34:53 +02:00
|
|
|
io.resp.bits.rd := cmd.bits.inst.rd
|
2013-09-25 01:32:49 +02:00
|
|
|
// Must respond with the appropriate tag or undefined behavior
|
|
|
|
io.resp.bits.data := accum
|
|
|
|
// Semantics is to always send out prior accumulator register value
|
2013-09-15 07:34:53 +02:00
|
|
|
|
2013-09-25 01:32:49 +02:00
|
|
|
io.busy := cmd.valid || busy.reduce(_||_)
|
|
|
|
// Be busy when have pending memory requests or committed possibility of pending requests
|
2013-09-15 00:31:50 +02:00
|
|
|
io.interrupt := Bool(false)
|
2013-09-25 01:32:49 +02:00
|
|
|
// Set this true to trigger an interrupt on the processor (please refer to supervisor documentation)
|
2013-09-15 07:34:53 +02:00
|
|
|
|
2013-09-25 01:32:49 +02:00
|
|
|
// MEMORY REQUEST INTERFACE
|
2013-09-24 19:54:09 +02:00
|
|
|
io.mem.req.valid := cmd.valid && doLoad && !stallReg && !stallResp
|
2013-09-15 07:34:53 +02:00
|
|
|
io.mem.req.bits.addr := addend
|
2013-09-24 19:54:09 +02:00
|
|
|
io.mem.req.bits.tag := addr
|
2013-09-15 07:34:53 +02:00
|
|
|
io.mem.req.bits.cmd := M_XRD // perform a load (M_XWR for stores)
|
|
|
|
io.mem.req.bits.typ := MT_D // D = 8 bytes, W = 4, H = 2, B = 1
|
|
|
|
io.mem.req.bits.data := Bits(0) // we're not performing any stores...
|
2014-05-15 01:17:39 +02:00
|
|
|
|
2015-12-03 01:28:23 +01:00
|
|
|
io.autl.acquire.valid := false
|
|
|
|
io.autl.grant.ready := false
|
2013-09-15 00:31:50 +02:00
|
|
|
}
|
2015-11-26 01:02:27 +01:00
|
|
|
|
|
|
|
class TranslatorExample(implicit p: Parameters) extends RoCC()(p) {
|
|
|
|
val req_addr = Reg(UInt(width = coreMaxAddrBits))
|
|
|
|
val req_rd = Reg(io.resp.bits.rd)
|
|
|
|
val req_offset = req_addr(pgIdxBits - 1, 0)
|
|
|
|
val req_vpn = req_addr(coreMaxAddrBits - 1, pgIdxBits)
|
2016-03-03 08:29:58 +01:00
|
|
|
val pte = Reg(new PTE)
|
2015-11-26 01:02:27 +01:00
|
|
|
|
|
|
|
val s_idle :: s_ptw_req :: s_ptw_resp :: s_resp :: Nil = Enum(Bits(), 4)
|
|
|
|
val state = Reg(init = s_idle)
|
|
|
|
|
|
|
|
io.cmd.ready := (state === s_idle)
|
|
|
|
|
|
|
|
when (io.cmd.fire()) {
|
|
|
|
req_rd := io.cmd.bits.inst.rd
|
|
|
|
req_addr := io.cmd.bits.rs1
|
|
|
|
state := s_ptw_req
|
|
|
|
}
|
|
|
|
|
2016-02-25 07:39:00 +01:00
|
|
|
private val ptw = io.ptw(0)
|
2015-11-26 01:02:27 +01:00
|
|
|
|
2016-02-25 07:39:00 +01:00
|
|
|
when (ptw.req.fire()) { state := s_ptw_resp }
|
|
|
|
|
|
|
|
when (state === s_ptw_resp && ptw.resp.valid) {
|
2016-03-03 08:29:58 +01:00
|
|
|
pte := ptw.resp.bits.pte
|
2015-11-26 01:02:27 +01:00
|
|
|
state := s_resp
|
|
|
|
}
|
|
|
|
|
|
|
|
when (io.resp.fire()) { state := s_idle }
|
|
|
|
|
2016-02-25 07:39:00 +01:00
|
|
|
ptw.req.valid := (state === s_ptw_req)
|
|
|
|
ptw.req.bits.addr := req_vpn
|
|
|
|
ptw.req.bits.store := Bool(false)
|
|
|
|
ptw.req.bits.fetch := Bool(false)
|
2015-11-26 01:02:27 +01:00
|
|
|
|
|
|
|
io.resp.valid := (state === s_resp)
|
|
|
|
io.resp.bits.rd := req_rd
|
2016-08-04 20:17:13 +02:00
|
|
|
io.resp.bits.data := Mux(pte.leaf(), Cat(pte.ppn, req_offset), SInt(-1, xLen).asUInt)
|
2015-11-26 01:02:27 +01:00
|
|
|
|
|
|
|
io.busy := (state =/= s_idle)
|
|
|
|
io.interrupt := Bool(false)
|
|
|
|
io.mem.req.valid := Bool(false)
|
2015-12-03 01:28:23 +01:00
|
|
|
io.autl.acquire.valid := Bool(false)
|
|
|
|
io.autl.grant.ready := Bool(false)
|
2015-11-26 01:02:27 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
class CharacterCountExample(implicit p: Parameters) extends RoCC()(p)
|
|
|
|
with HasTileLinkParameters {
|
|
|
|
|
|
|
|
private val blockOffset = tlBeatAddrBits + tlByteAddrBits
|
|
|
|
|
|
|
|
val needle = Reg(UInt(width = 8))
|
|
|
|
val addr = Reg(UInt(width = coreMaxAddrBits))
|
|
|
|
val count = Reg(UInt(width = xLen))
|
|
|
|
val resp_rd = Reg(io.resp.bits.rd)
|
|
|
|
|
|
|
|
val addr_block = addr(coreMaxAddrBits - 1, blockOffset)
|
|
|
|
val offset = addr(blockOffset - 1, 0)
|
|
|
|
val next_addr = (addr_block + UInt(1)) << UInt(blockOffset)
|
|
|
|
|
|
|
|
val s_idle :: s_acq :: s_gnt :: s_check :: s_resp :: Nil = Enum(Bits(), 5)
|
|
|
|
val state = Reg(init = s_idle)
|
|
|
|
|
2015-12-03 01:28:23 +01:00
|
|
|
val gnt = io.autl.grant.bits
|
2015-11-26 01:02:27 +01:00
|
|
|
val recv_data = Reg(UInt(width = tlDataBits))
|
|
|
|
val recv_beat = Reg(UInt(width = tlBeatAddrBits))
|
|
|
|
|
|
|
|
val data_bytes = Vec.tabulate(tlDataBytes) { i => recv_data(8 * (i + 1) - 1, 8 * i) }
|
|
|
|
val zero_match = data_bytes.map(_ === UInt(0))
|
|
|
|
val needle_match = data_bytes.map(_ === needle)
|
|
|
|
val first_zero = PriorityEncoder(zero_match)
|
|
|
|
|
|
|
|
val chars_found = PopCount(needle_match.zipWithIndex.map {
|
|
|
|
case (matches, i) =>
|
|
|
|
val idx = Cat(recv_beat, UInt(i, tlByteAddrBits))
|
|
|
|
matches && idx >= offset && UInt(i) <= first_zero
|
|
|
|
})
|
|
|
|
val zero_found = zero_match.reduce(_ || _)
|
|
|
|
val finished = Reg(Bool())
|
|
|
|
|
|
|
|
io.cmd.ready := (state === s_idle)
|
|
|
|
io.resp.valid := (state === s_resp)
|
|
|
|
io.resp.bits.rd := resp_rd
|
|
|
|
io.resp.bits.data := count
|
2015-12-03 01:28:23 +01:00
|
|
|
io.autl.acquire.valid := (state === s_acq)
|
|
|
|
io.autl.acquire.bits := GetBlock(addr_block = addr_block)
|
|
|
|
io.autl.grant.ready := (state === s_gnt)
|
2015-11-26 01:02:27 +01:00
|
|
|
|
|
|
|
when (io.cmd.fire()) {
|
|
|
|
addr := io.cmd.bits.rs1
|
|
|
|
needle := io.cmd.bits.rs2
|
|
|
|
resp_rd := io.cmd.bits.inst.rd
|
|
|
|
count := UInt(0)
|
|
|
|
finished := Bool(false)
|
|
|
|
state := s_acq
|
|
|
|
}
|
|
|
|
|
2015-12-03 01:28:23 +01:00
|
|
|
when (io.autl.acquire.fire()) { state := s_gnt }
|
2015-11-26 01:02:27 +01:00
|
|
|
|
2015-12-03 01:28:23 +01:00
|
|
|
when (io.autl.grant.fire()) {
|
2015-11-26 01:02:27 +01:00
|
|
|
recv_beat := gnt.addr_beat
|
|
|
|
recv_data := gnt.data
|
|
|
|
state := s_check
|
|
|
|
}
|
|
|
|
|
|
|
|
when (state === s_check) {
|
|
|
|
when (!finished) {
|
|
|
|
count := count + chars_found
|
|
|
|
}
|
|
|
|
when (zero_found) { finished := Bool(true) }
|
|
|
|
when (recv_beat === UInt(tlDataBeats - 1)) {
|
|
|
|
addr := next_addr
|
|
|
|
state := Mux(zero_found || finished, s_resp, s_acq)
|
|
|
|
} .otherwise {
|
|
|
|
state := s_gnt
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
when (io.resp.fire()) { state := s_idle }
|
|
|
|
|
|
|
|
io.busy := (state =/= s_idle)
|
|
|
|
io.interrupt := Bool(false)
|
|
|
|
io.mem.req.valid := Bool(false)
|
|
|
|
}
|
|
|
|
|
|
|
|
class OpcodeSet(val opcodes: Seq[UInt]) {
|
|
|
|
def |(set: OpcodeSet) =
|
|
|
|
new OpcodeSet(this.opcodes ++ set.opcodes)
|
|
|
|
|
|
|
|
def matches(oc: UInt) = opcodes.map(_ === oc).reduce(_ || _)
|
|
|
|
}
|
|
|
|
|
|
|
|
object OpcodeSet {
|
|
|
|
val custom0 = new OpcodeSet(Seq(Bits("b0001011")))
|
|
|
|
val custom1 = new OpcodeSet(Seq(Bits("b0101011")))
|
|
|
|
val custom2 = new OpcodeSet(Seq(Bits("b1011011")))
|
|
|
|
val custom3 = new OpcodeSet(Seq(Bits("b1111011")))
|
|
|
|
val all = custom0 | custom1 | custom2 | custom3
|
|
|
|
}
|
|
|
|
|
|
|
|
class RoccCommandRouter(opcodes: Seq[OpcodeSet])(implicit p: Parameters)
|
|
|
|
extends CoreModule()(p) {
|
|
|
|
val io = new Bundle {
|
|
|
|
val in = Decoupled(new RoCCCommand).flip
|
|
|
|
val out = Vec(opcodes.size, Decoupled(new RoCCCommand))
|
|
|
|
val busy = Bool(OUTPUT)
|
|
|
|
}
|
|
|
|
|
|
|
|
val cmd = Queue(io.in)
|
|
|
|
val cmdReadys = io.out.zip(opcodes).map { case (out, opcode) =>
|
|
|
|
val me = opcode.matches(cmd.bits.inst.opcode)
|
|
|
|
out.valid := cmd.valid && me
|
|
|
|
out.bits := cmd.bits
|
|
|
|
out.ready && me
|
|
|
|
}
|
|
|
|
cmd.ready := cmdReadys.reduce(_ || _)
|
|
|
|
io.busy := cmd.valid
|
|
|
|
|
|
|
|
assert(PopCount(cmdReadys) <= UInt(1),
|
|
|
|
"Custom opcode matched for more than one accelerator")
|
|
|
|
}
|