tensor: Fix perf counter; comment out dpi

This commit is contained in:
Hansung Kim
2024-05-31 00:32:32 -07:00
parent 73293061ea
commit 0ebbb8e223
2 changed files with 16 additions and 16 deletions

View File

@@ -528,7 +528,7 @@ module VX_tensor_octet #(
perf_tensor_dpu_total <= '0; perf_tensor_dpu_total <= '0;
end else begin end else begin
if (do_hmma) begin if (do_hmma) begin
perf_tensor_dpu_total <= perf_tensor_dpu_total + 1'b1; perf_tensor_dpu_total <= perf_tensor_dpu_total + 2'd2;
end end
end end
end end

View File

@@ -24,23 +24,23 @@ module VX_tensor_dpu #(
output [3:0][3:0][31:0] D_tile, output [3:0][3:0][31:0] D_tile,
output [`NW_WIDTH-1:0] D_wid output [`NW_WIDTH-1:0] D_wid
); );
logic [3:0][3:0][31:0] result_hmma; // logic [3:0][3:0][31:0] result_hmma;
always @(*) begin // always @(*) begin
dpi_hmma(valid_in, A_tile, B_tile, C_tile, result_hmma); // dpi_hmma(valid_in, A_tile, B_tile, C_tile, result_hmma);
end // end
logic ready_reg; // logic ready_reg;
always @(posedge clk) begin // always @(posedge clk) begin
if (reset) begin // if (reset) begin
ready_reg <= '1; // ready_reg <= '1;
end else if (valid_in && ready_in) begin // end else if (valid_in && ready_in) begin
ready_reg <= '0; // ready_reg <= '0;
dpi_print_results(int'(ISW), int'(OCTET), A_tile, B_tile, C_tile, result_hmma); // dpi_print_results(int'(ISW), int'(OCTET), A_tile, B_tile, C_tile, result_hmma);
end else if (valid_out && ready_out) begin // end else if (valid_out && ready_out) begin
ready_reg <= '1; // ready_reg <= '1;
end // end
end // end
// // fixed-latency queue // // fixed-latency queue
// VX_shift_register #( // VX_shift_register #(