Skip to content

Commit

Permalink
lint
Browse files Browse the repository at this point in the history
  • Loading branch information
aciddelgado committed Nov 7, 2023
1 parent 4b3bec1 commit 4a96881
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions onnxruntime/contrib_ops/cuda/bert/group_query_attention.h
Original file line number Diff line number Diff line change
Expand Up @@ -20,8 +20,8 @@ class GroupQueryAttention final : public CudaKernel {
Status ComputeInternal(OpKernelContext* context) const override;

protected:
- int num_heads_; // number of attention heads
- int kv_num_heads_; // different for k and v for group query attention
+ int num_heads_; // number of attention heads
+ int kv_num_heads_; // different for k and v for group query attention
// bool left_padding_; // shifts last token to end of buffer
bool is_unidirectional_; // causal
bool is_past_bsnh_;
Expand Down

0 comments on commit 4a96881

Please sign in to comment.