Skip to content

Commit b83e149

Browse files
cuda : get_row_rounding F32 (#4095)
* Fix #4017
* Update ggml-cuda.cu
  Co-authored-by: Jared Van Bortel <[email protected]>
* Update ggml-cuda.cu
  Co-authored-by: Jared Van Bortel <[email protected]>

---------

Co-authored-by: Jared Van Bortel <[email protected]>
1 parent 4f447a4 commit b83e149

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

ggml-cuda.cu

+2
Original file line number | Diff line number | Diff line change
@@ -6356,6 +6356,7 @@ static int64_t get_row_rounding(ggml_type type) {
63566356
case GGML_TYPE_Q8_0:
63576357
return max_compute_capability >= CC_RDNA2 ? 128 : 64;
63586358
case GGML_TYPE_F16:
6359+
case GGML_TYPE_F32:
63596360
return 1;
63606361
case GGML_TYPE_Q2_K:
63616362
return max_compute_capability >= CC_RDNA2 ? 128 : 32;
@@ -6378,6 +6379,7 @@ static int64_t get_row_rounding(ggml_type type) {
63786379
case GGML_TYPE_Q8_0:
63796380
return 64;
63806381
case GGML_TYPE_F16:
6382+
case GGML_TYPE_F32:
63816383
return 1;
63826384
case GGML_TYPE_Q2_K:
63836385
case GGML_TYPE_Q3_K:

0 commit comments

Comments
 (0)