Skip to content

Commit

Permalink
fix for review comments
Browse files Browse the repository at this point in the history
  • Loading branch information
kailums committed Jun 27, 2024
1 parent a5581e4 commit 7db65da
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions onnxruntime/core/providers/cuda/tensor/split_impl.cu
Original file line number Diff line number Diff line change
Expand Up @@ -227,7 +227,7 @@ Status Split3Inner(cudaStream_t stream, const size_t element_size, const int64_t

// determine threads based on the size of the output
auto threadsPerBlock = kNumThreadsPerBlock;
- if ((inner_size_in_byte / VEC_SIZE) < 128) {
+ if ((inner_size_in_byte / VEC_SIZE) <= 128) {
// use less threads when the size is small
threadsPerBlock = 128;
}
Expand All @@ -247,16 +247,16 @@ Status Split3Inner(cudaStream_t stream, const size_t element_size, const int64_t
CASE_ELEMENT_TYPE(int4);
break;
case 8:
- CASE_ELEMENT_TYPE(int2);
+ CASE_ELEMENT_TYPE(int64_t);
break;
case 4:
- CASE_ELEMENT_TYPE(int1);
+ CASE_ELEMENT_TYPE(int32_t);
break;
case 2:
- CASE_ELEMENT_TYPE(short1);
+ CASE_ELEMENT_TYPE(int16_t);
break;
default:
- CASE_ELEMENT_TYPE(char1);
+ CASE_ELEMENT_TYPE(int8_t);
break;
#undef CASE_ELEMENT_TYPE
}
Expand Down

0 comments on commit 7db65da

Please sign in to comment.