tensor: Decode rd of macro-op to designate additional accumulator

This is useful when the tensor core needs to write its output to multiple
accumulator registers, e.g. when computing an outer product within the register file (RF).
This commit is contained in:
Hansung Kim
2024-05-31 19:17:56 -07:00
parent 0ebbb8e223
commit 9caafb2d8a
2 changed files with 20 additions and 4 deletions

View File

@@ -545,6 +545,12 @@ module VX_decode #(
// Decode case for the `INST_EXT4 opcode: routes the instruction to the tensor
// execution unit (`EX_TENSOR) as an HMMA operation (`INST_TENSOR_HMMA).
`INST_EXT4: begin
ex_type = `EX_TENSOR;
op_type = `INST_TENSOR_HMMA;
// tensor core macroop is encoded as r-type
// NOTE(review): rs3 is also marked as used below; the standard RISC-V R-type
// format has no rs3 field (R4-type does) -- confirm which encoding is intended.
// rd is decoded so the macro-op can designate an additional accumulator
// register as its destination.
use_rd = 1;
// Mark each register operand of the macro-op as an in-use integer register.
// NOTE(review): `USED_IREG is defined outside this view; presumably it may
// already assert use_rd for rd, making the explicit assignment above
// redundant -- verify against the macro definition.
`USED_IREG (rd);
`USED_IREG (rs1);
`USED_IREG (rs2);
`USED_IREG (rs3);
end
`endif
default:;