We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f8e5813 commit 05697f6 (Copy full SHA for 05697f6)
ggml/src/ggml-metal.metal
@@ -19,18 +19,12 @@ constexpr constant static float kvalues_iq4nl_f[16] = {
19
// NOTE: this is not dequantizing - we are simply fitting the template
20
template <typename type4x4>
21
void dequantize_f32(device const float4x4 * src, short il, thread type4x4 & reg) {
22
- float4x4 temp = *(((device float4x4 *)src));
23
- for (int i = 0; i < 16; i++){
24
- reg[i/4][i%4] = temp[i/4][i%4];
25
- }
+ reg = (type4x4)(*src);
26
}
27
28
29
void dequantize_f16(device const half4x4 * src, short il, thread type4x4 & reg) {
30
- half4x4 temp = *(((device half4x4 *)src));
31
32
33
34
35
36
0 commit comments