Skip to content

Commit

Permalink
Don't pack left-hand operand since this is currently only supported for `qc4w` weights, and this benchmark uses `qc8w` weights.
Browse files Browse the repository at this point in the history

PiperOrigin-RevId: 700264198
  • Loading branch information
gonnet authored and xnnpack-bot committed Nov 26, 2024
1 parent 740a2a7 commit a4e966a
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions bench/models/qd8-attention.cc
Original file line number Diff line number Diff line change
Expand Up @@ -57,8 +57,8 @@ xnn_subgraph_t QD8Attention(size_t batch_size, size_t seq_len,
return nullptr;
}

status = xnn_define_unary(subgraph, xnn_unary_convert, /*params=*/nullptr, input_id, quantized_input_id,
/*XNN_FLAG_MAYBE_PACK_FOR_GEMM=*/0x00000080);
status = xnn_define_unary(subgraph, xnn_unary_convert, /*params=*/nullptr,
input_id, quantized_input_id, /*flags=*/0);
if (status != xnn_status_success) {
std::cerr << "failed to create create convert " << std::endl;
return nullptr;
Expand Down Expand Up @@ -334,9 +334,9 @@ xnn_subgraph_t QD8Attention(size_t batch_size, size_t seq_len,
return nullptr;
}

status =
xnn_define_unary(subgraph, xnn_unary_convert, /*params=*/nullptr, outcome_reshaped_id, quantized_outcome_id,
/*XNN_FLAG_MAYBE_PACK_FOR_GEMM=*/0x00000080);
status = xnn_define_unary(subgraph, xnn_unary_convert, /*params=*/nullptr,
outcome_reshaped_id, quantized_outcome_id,
/*flags=*/0);
if (status != xnn_status_success) {
std::cerr << "failed to create create convert " << std::endl;
return nullptr;
Expand Down

0 comments on commit a4e966a

Please sign in to comment.