Skip to content

Commit b4ae700

Browse files
committed
Pass uint16_t (not uint32_t) scale values to unpack8 in the Q4_K/Q5_K mul_mat_vec shaders; add Vim swap files (*.swp) to .gitignore (about time)
1 parent 1730771 commit b4ae700

File tree

3 files changed

+13
-12
lines changed

3 files changed

+13
-12
lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@
18 18   *.metallib
19 19   *.o
20 20   *.so
   21 + *.swp
21 22   *.tmp
22 23
23 24   # IDE / OS
# IDE / OS

ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_q4_k.comp

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -47,12 +47,12 @@ void compute_outputs(const uint32_t first_row, const uint32_t num_rows) {
47 47   const FLOAT_TYPE dall = FLOAT_TYPE(d.x);
48 48   const FLOAT_TYPE dmin = FLOAT_TYPE(d.y);
49 49
50    - uint32_t scale0_u32 = data_a_packed16[ib0 + i].scales[v_im ];
51    - uint32_t scale4_u32 = data_a_packed16[ib0 + i].scales[v_im + 2];
52    - uint32_t scale8_u32 = data_a_packed16[ib0 + i].scales[v_im + 4];
53    - uvec2 scale0 = uvec2(unpack8(scale0_u32));
54    - uvec2 scale4 = uvec2(unpack8(scale4_u32));
55    - uvec2 scale8 = uvec2(unpack8(scale8_u32));
   50 + uint16_t scale0_u16 = data_a_packed16[ib0 + i].scales[v_im ];
   51 + uint16_t scale4_u16 = data_a_packed16[ib0 + i].scales[v_im + 2];
   52 + uint16_t scale8_u16 = data_a_packed16[ib0 + i].scales[v_im + 4];
   53 + uvec2 scale0 = uvec2(unpack8(scale0_u16));
   54 + uvec2 scale4 = uvec2(unpack8(scale4_u16));
   55 + uvec2 scale8 = uvec2(unpack8(scale8_u16));
56 56
57 57   const uint32_t sc0 = ( scale0.x & 0x3f);
58 58   const uint32_t sc1 = ( scale0.y & 0x3f);

ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_q5_k.comp

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -46,12 +46,12 @@ void compute_outputs(const uint32_t first_row, const uint32_t num_rows) {
46 46   const FLOAT_TYPE dall = FLOAT_TYPE(d.x);
47 47   const FLOAT_TYPE dmin = FLOAT_TYPE(d.y);
48 48
49    - uint32_t scale0_u32 = data_a_packed16[ib0 + i].scales[v_im ];
50    - uint32_t scale4_u32 = data_a_packed16[ib0 + i].scales[v_im + 2];
51    - uint32_t scale8_u32 = data_a_packed16[ib0 + i].scales[v_im + 4];
52    - uvec2 scale0 = uvec2(unpack8(scale0_u32));
53    - uvec2 scale4 = uvec2(unpack8(scale4_u32));
54    - uvec2 scale8 = uvec2(unpack8(scale8_u32));
   49 + uint16_t scale0_u16 = data_a_packed16[ib0 + i].scales[v_im ];
   50 + uint16_t scale4_u16 = data_a_packed16[ib0 + i].scales[v_im + 2];
   51 + uint16_t scale8_u16 = data_a_packed16[ib0 + i].scales[v_im + 4];
   52 + uvec2 scale0 = uvec2(unpack8(scale0_u16));
   53 + uvec2 scale4 = uvec2(unpack8(scale4_u16));
   54 + uvec2 scale8 = uvec2(unpack8(scale8_u16));
55 55
56 56   const uint32_t sc0 = ( scale0.x & 0x3f);
57 57   const uint32_t sc1 = ( scale0.y & 0x3f);

0 commit comments

Comments
 (0)