1
0

add FP recoding

This commit is contained in:
Andrew Waterman 2012-02-12 23:31:50 -08:00
parent 25ecfb9bbc
commit 069037ff3a
4 changed files with 72 additions and 7 deletions

View File

@ -105,6 +105,7 @@ class rocketProc extends Component
dpath.io.dmem.resp_val := arb.io.cpu.resp_val; dpath.io.dmem.resp_val := arb.io.cpu.resp_val;
dpath.io.dmem.resp_miss := arb.io.cpu.resp_miss; dpath.io.dmem.resp_miss := arb.io.cpu.resp_miss;
dpath.io.dmem.resp_replay := arb.io.cpu.resp_replay; dpath.io.dmem.resp_replay := arb.io.cpu.resp_replay;
dpath.io.dmem.resp_type := io.dmem.resp_type;
dpath.io.dmem.resp_tag := arb.io.cpu.resp_tag; dpath.io.dmem.resp_tag := arb.io.cpu.resp_tag;
dpath.io.dmem.resp_data := arb.io.cpu.resp_data; dpath.io.dmem.resp_data := arb.io.cpu.resp_data;
dpath.io.dmem.resp_data_subword := io.dmem.resp_data_subword; dpath.io.dmem.resp_data_subword := io.dmem.resp_data_subword;

View File

@ -15,6 +15,7 @@ class ioDpathDmem extends Bundle()
val resp_val = Bool(INPUT); val resp_val = Bool(INPUT);
val resp_miss = Bool(INPUT); val resp_miss = Bool(INPUT);
val resp_replay = Bool(INPUT); val resp_replay = Bool(INPUT);
val resp_type = Bits(3, INPUT);
val resp_tag = Bits(CPU_TAG_BITS, INPUT); val resp_tag = Bits(CPU_TAG_BITS, INPUT);
val resp_data = Bits(64, INPUT); val resp_data = Bits(64, INPUT);
val resp_data_subword = Bits(64, INPUT); val resp_data_subword = Bits(64, INPUT);
@ -400,6 +401,7 @@ class rocketDpath extends Component
io.fpu.dmem_resp_val := io.dmem.resp_val && dmem_resp_fpu io.fpu.dmem_resp_val := io.dmem.resp_val && dmem_resp_fpu
io.fpu.dmem_resp_data := io.dmem.resp_data io.fpu.dmem_resp_data := io.dmem.resp_data
io.fpu.dmem_resp_type := io.dmem.resp_type
io.fpu.dmem_resp_tag := dmem_resp_waddr io.fpu.dmem_resp_tag := dmem_resp_waddr
// writeback stage // writeback stage

View File

@ -176,6 +176,7 @@ class ioDpathFPU extends Bundle {
val toint_data = Bits(64, INPUT) val toint_data = Bits(64, INPUT)
val dmem_resp_val = Bool(OUTPUT) val dmem_resp_val = Bool(OUTPUT)
val dmem_resp_type = Bits(3, OUTPUT)
val dmem_resp_tag = UFix(5, OUTPUT) val dmem_resp_tag = UFix(5, OUTPUT)
val dmem_resp_data = Bits(64, OUTPUT) val dmem_resp_data = Bits(64, OUTPUT)
} }
@ -200,10 +201,12 @@ class rocketFPIntUnit extends Component
val exc = Bits(5, OUTPUT) val exc = Bits(5, OUTPUT)
} }
val unrecoded_s = io.in(31,0) val unrec_s = new hardfloat.recodedFloat32ToFloat32
val unrecoded_d = io.in val unrec_d = new hardfloat.recodedFloat64ToFloat64
unrec_s.io.in := io.in
unrec_d.io.in := io.in
io.store_data := Mux(io.single, Cat(unrecoded_s, unrecoded_s), unrecoded_d) io.store_data := Mux(io.single, Cat(unrec_s.io.out, unrec_s.io.out), unrec_d.io.out)
val scmp = Bool(false) val scmp = Bool(false)
val scmp_exc = Bits(0) val scmp_exc = Bits(0)
@ -219,10 +222,10 @@ class rocketFPIntUnit extends Component
// output muxing // output muxing
val (out_s, exc_s) = (Wire() { Bits() }, Wire() { Bits() }) val (out_s, exc_s) = (Wire() { Bits() }, Wire() { Bits() })
out_s := Cat(Fill(32, unrecoded_s(31)), unrecoded_s) out_s := Cat(Fill(32, unrec_s.io.out(31)), unrec_s.io.out)
exc_s := Bits(0) exc_s := Bits(0)
val (out_d, exc_d) = (Wire() { Bits() }, Wire() { Bits() }) val (out_d, exc_d) = (Wire() { Bits() }, Wire() { Bits() })
out_d := unrecoded_d out_d := unrec_d.io.out
exc_d := Bits(0) exc_d := Bits(0)
when (io.cmd === FCMD_MTFSR || io.cmd === FCMD_MFFSR) { when (io.cmd === FCMD_MTFSR || io.cmd === FCMD_MFFSR) {
@ -251,6 +254,51 @@ class rocketFPIntUnit extends Component
io.exc := Mux(io.single, exc_s, exc_d) io.exc := Mux(io.single, exc_s, exc_d)
} }
/** Integer-to-floating-point side of the FPU.
  *
  * Takes a 64-bit value on `io.in` and produces a 65-bit value on `io.out`
  * together with a 5-bit exception field on `io.exc`.
  *
  *  - By default the input is run through the hardfloat recoders
  *    (`float32ToRecodedFloat32` / `float64ToRecodedFloat64`) and the
  *    recoded value is forwarded.
  *  - For the integer-to-float conversion commands (`FCMD_CVT_FMT_W`, `_WU`,
  *    `_L`, `_LU`) the output is taken from `i2s` / `i2d`, which are currently
  *    constant-zero placeholders.
  *  - For `FCMD_MTFSR` / `FCMD_MFFSR` the low `FSR_WIDTH` bits of the
  *    single-precision result are replaced by the raw low bits of `io.in`.
  *
  * `io.single` selects between the single- and double-precision results.
  * `io.fsr` is declared on the interface but is not read by this block.
  *
  * NOTE: val names are kept as-is; NOTE(review): the HDL front end may derive
  * signal names from them -- confirm before renaming.
  */
class rocketIntFPUnit extends Component
{
  val io = new Bundle {
    val single = Bool(INPUT)              // selects the single-precision result path
    val cmd    = Bits(FCMD_WIDTH, INPUT)  // FPU command, compared against FCMD_* below
    val fsr    = Bits(FSR_WIDTH, INPUT)   // not read inside this block
    val in     = Bits(64, INPUT)          // raw value to recode / convert
    val out    = Bits(65, OUTPUT)
    val exc    = Bits(5, OUTPUT)
  }

  // Recode the raw input into hardfloat's internal format. Both recoders are
  // driven from the same 64-bit input.
  // NOTE(review): rec_s presumably consumes only the low 32 bits -- confirm
  // against the hardfloat module's port width.
  val rec_s = new hardfloat.float32ToRecodedFloat32
  val rec_d = new hardfloat.float64ToRecodedFloat64
  rec_s.io.in := io.in
  rec_d.io.in := io.in

  // Placeholders for the integer-to-float conversion results and their
  // exception flags; all are constant zero here.
  val i2s = Bits(0)
  val i2s_exc = Bits(0)
  val i2d = Bits(0)
  val i2d_exc = Bits(0)

  // output muxing
  // Defaults: recoded input, no exceptions.
  val (out_s, exc_s) = (Wire() { Bits() }, Wire() { Bits() })
  out_s := rec_s.io.out
  exc_s := Bits(0)

  val (out_d, exc_d) = (Wire() { Bits() }, Wire() { Bits() })
  out_d := rec_d.io.out
  exc_d := Bits(0)

  // Integer-to-float conversions override the recoded defaults.
  when (io.cmd === FCMD_CVT_FMT_W || io.cmd === FCMD_CVT_FMT_WU ||
        io.cmd === FCMD_CVT_FMT_L || io.cmd === FCMD_CVT_FMT_LU) {
    out_s := i2s
    exc_s := i2s_exc
    out_d := i2d
    exc_d := i2d_exc
  }

  // FSR moves: keep the upper bits of the recoded single-precision value and
  // splice the raw low FSR_WIDTH bits of the input underneath them.
  // The upper bits are taken from rec_s.io.out (the default driver of out_s)
  // rather than from out_s itself, so the wire never feeds its own
  // combinational assignment. This matches the default value as long as the
  // FCMD_* encodings are distinct, so that this branch and the conversion
  // branch above cannot both be active.
  when (io.cmd === FCMD_MTFSR || io.cmd === FCMD_MFFSR) {
    out_s := Cat(rec_s.io.out(32,FSR_WIDTH), io.in(FSR_WIDTH-1,0))
  }

  // The single-precision result is widened with a 32x replicated UFix(1)
  // prefix before being muxed against the double-precision result.
  io.out := Mux(io.single, Cat(Fill(32,UFix(1)), out_s), out_d)
  io.exc := Mux(io.single, exc_s, exc_d)
}
class rocketFPU extends Component class rocketFPU extends Component
{ {
val io = new Bundle { val io = new Bundle {
@ -274,18 +322,25 @@ class rocketFPU extends Component
// load response // load response
val load_wb = Reg(io.dpath.dmem_resp_val, resetVal = Bool(false)) val load_wb = Reg(io.dpath.dmem_resp_val, resetVal = Bool(false))
val load_wb_single = Reg() { Bool() }
val load_wb_data = Reg() { Bits(width = 64) } // XXX WTF why doesn't bit width inference work for the regfile?! val load_wb_data = Reg() { Bits(width = 64) } // XXX WTF why doesn't bit width inference work for the regfile?!
val load_wb_tag = Reg() { UFix() } val load_wb_tag = Reg() { UFix() }
when (io.dpath.dmem_resp_val) { when (io.dpath.dmem_resp_val) {
load_wb_single := io.dpath.dmem_resp_type === MT_W || io.dpath.dmem_resp_type === MT_WU
load_wb_data := io.dpath.dmem_resp_data load_wb_data := io.dpath.dmem_resp_data
load_wb_tag := io.dpath.dmem_resp_tag load_wb_tag := io.dpath.dmem_resp_tag
} }
val rec_s = new hardfloat.float32ToRecodedFloat32
val rec_d = new hardfloat.float64ToRecodedFloat64
rec_s.io.in := load_wb_data
rec_d.io.in := load_wb_data
val load_wb_data_recoded = Mux(load_wb_single, Cat(Fill(32,UFix(1)), rec_s.io.out), rec_d.io.out)
val fsr_rm = Reg() { Bits(width = 3) } val fsr_rm = Reg() { Bits(width = 3) }
val fsr_exc = Reg() { Bits(width = 5) } val fsr_exc = Reg() { Bits(width = 5) }
// regfile // regfile
val regfile = Mem(32, load_wb, load_wb_tag, load_wb_data); val regfile = Mem(32, load_wb, load_wb_tag, load_wb_data_recoded);
regfile.setReadLatency(0); regfile.setReadLatency(0);
regfile.setTarget('inst); regfile.setTarget('inst);
@ -332,10 +387,15 @@ class rocketFPU extends Component
io.dpath.store_data := fpiu.io.store_data io.dpath.store_data := fpiu.io.store_data
io.dpath.toint_data := fpiu.io.toint_data io.dpath.toint_data := fpiu.io.toint_data
val ifpu = new rocketIntFPUnit
ifpu.io.single := ctrl.single
ifpu.io.cmd := ctrl.cmd
ifpu.io.in := fp_fromint_data
val retire_toint = Reg(!io.ctrl.killm && fp_toint_val, resetVal = Bool(false)) val retire_toint = Reg(!io.ctrl.killm && fp_toint_val, resetVal = Bool(false))
val retire_toint_exc = Reg(fpiu.io.exc) val retire_toint_exc = Reg(fpiu.io.exc)
val retire_fromint = Reg(!io.ctrl.killm && fp_fromint_val, resetVal = Bool(false)) val retire_fromint = Reg(!io.ctrl.killm && fp_fromint_val, resetVal = Bool(false))
val retire_fromint_wdata = Reg(fp_fromint_data) val retire_fromint_wdata = Reg(ifpu.io.out)
val retire_fromint_waddr = Reg(fp_waddr) val retire_fromint_waddr = Reg(fp_waddr)
when (retire_toint) { when (retire_toint) {

View File

@ -667,6 +667,7 @@ class ioDmem(view: List[String] = null) extends Bundle(view) {
val resp_nack = Bool(OUTPUT); val resp_nack = Bool(OUTPUT);
val resp_val = Bool(OUTPUT); val resp_val = Bool(OUTPUT);
val resp_replay = Bool(OUTPUT); val resp_replay = Bool(OUTPUT);
val resp_type = Bits(3, OUTPUT);
val resp_data = Bits(64, OUTPUT); val resp_data = Bits(64, OUTPUT);
val resp_data_subword = Bits(64, OUTPUT); val resp_data_subword = Bits(64, OUTPUT);
val resp_tag = Bits(DCACHE_TAG_BITS, OUTPUT); val resp_tag = Bits(DCACHE_TAG_BITS, OUTPUT);
@ -967,6 +968,7 @@ class HellaCache extends Component {
io.cpu.resp_replay := replayer.io.cpu_resp_val io.cpu.resp_replay := replayer.io.cpu_resp_val
io.cpu.resp_miss := tag_miss && !nack_miss && r_req_read io.cpu.resp_miss := tag_miss && !nack_miss && r_req_read
io.cpu.resp_tag := Mux(replayer.io.cpu_resp_val, replayer.io.cpu_resp_tag, r_cpu_req_tag) io.cpu.resp_tag := Mux(replayer.io.cpu_resp_val, replayer.io.cpu_resp_tag, r_cpu_req_tag)
io.cpu.resp_type := loadgen.io.typ
io.cpu.resp_data := loadgen.io.dout io.cpu.resp_data := loadgen.io.dout
io.cpu.resp_data_subword := loadgen.io.r_dout_subword io.cpu.resp_data_subword := loadgen.io.r_dout_subword