Skip to content

Commit

Permalink
lint
Browse files Browse the repository at this point in the history
  • Loading branch information
aciddelgado committed Oct 30, 2023
1 parent 7af984c commit bd4d74c
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion onnxruntime/contrib_ops/cpu/bert/attention_common.h
Original file line number Diff line number Diff line change
Expand Up @@ -96,7 +96,7 @@ struct GroupQueryAttentionParameters {
int head_size;
int kv_hidden_size;
int kv_num_heads;
int num_splits; // number of splits for splitkv
int num_splits; // number of splits for splitkv
bool is_unidirectional; // causal
float scale;
AttentionQkvFormat qkv_format;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -195,7 +195,7 @@ std::tuple<int, int, int> get_num_splits_and_buffer_sizes(int batch_size, int se
int max_splits = 128;
// split kv buffers
int num_splits = num_splits_heuristic(batch_size, seqlen_q, seqlen_k, num_heads, head_size,
num_SMs, max_splits);
num_SMs, max_splits);
if (num_splits > 1) {
// softmax_lse_accum buffer
int softmax_lse_accum_bytes = get_softmax_lse_accum_size(num_splits, batch_size, num_heads, seqlen_q);
Expand Down

0 comments on commit bd4d74c

Please sign in to comment.