tensor: Fix perf counter; comment out dpi
This commit is contained in:
@@ -528,7 +528,7 @@ module VX_tensor_octet #(
|
|||||||
perf_tensor_dpu_total <= '0;
|
perf_tensor_dpu_total <= '0;
|
||||||
end else begin
|
end else begin
|
||||||
if (do_hmma) begin
|
if (do_hmma) begin
|
||||||
perf_tensor_dpu_total <= perf_tensor_dpu_total + 1'b1;
|
perf_tensor_dpu_total <= perf_tensor_dpu_total + 2'd2;
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
|
|||||||
@@ -24,23 +24,23 @@ module VX_tensor_dpu #(
|
|||||||
output [3:0][3:0][31:0] D_tile,
|
output [3:0][3:0][31:0] D_tile,
|
||||||
output [`NW_WIDTH-1:0] D_wid
|
output [`NW_WIDTH-1:0] D_wid
|
||||||
);
|
);
|
||||||
logic [3:0][3:0][31:0] result_hmma;
|
// logic [3:0][3:0][31:0] result_hmma;
|
||||||
|
|
||||||
always @(*) begin
|
// always @(*) begin
|
||||||
dpi_hmma(valid_in, A_tile, B_tile, C_tile, result_hmma);
|
// dpi_hmma(valid_in, A_tile, B_tile, C_tile, result_hmma);
|
||||||
end
|
// end
|
||||||
|
|
||||||
logic ready_reg;
|
// logic ready_reg;
|
||||||
always @(posedge clk) begin
|
// always @(posedge clk) begin
|
||||||
if (reset) begin
|
// if (reset) begin
|
||||||
ready_reg <= '1;
|
// ready_reg <= '1;
|
||||||
end else if (valid_in && ready_in) begin
|
// end else if (valid_in && ready_in) begin
|
||||||
ready_reg <= '0;
|
// ready_reg <= '0;
|
||||||
dpi_print_results(int'(ISW), int'(OCTET), A_tile, B_tile, C_tile, result_hmma);
|
// dpi_print_results(int'(ISW), int'(OCTET), A_tile, B_tile, C_tile, result_hmma);
|
||||||
end else if (valid_out && ready_out) begin
|
// end else if (valid_out && ready_out) begin
|
||||||
ready_reg <= '1;
|
// ready_reg <= '1;
|
||||||
end
|
// end
|
||||||
end
|
// end
|
||||||
|
|
||||||
// // fixed-latency queue
|
// // fixed-latency queue
|
||||||
// VX_shift_register #(
|
// VX_shift_register #(
|
||||||
|
|||||||
Reference in New Issue
Block a user