Skip to content

Commit c1f8850

Browse files
sw and ggerganov authored
ggml : introduce structs for the q4 data blocks (#356)
* Introduce structs for the q4 data blocks
* ggml : rename quant struct variables + fix ARM_NEON

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
1 parent e067026 commit c1f8850

File tree

6 files changed

+150
-235
lines changed

6 files changed

+150
-235
lines changed

examples/quantize/quantize.cpp

+1 -3
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,6 @@
44
#include <cstdio>
55
#include <string>
66

7-
const int QK = 32;
8-
97
// usage:
108
// ./llama-quantize models/llama/ggml-model.bin models/llama/ggml-model-quant.bin type
119
//
@@ -39,7 +37,7 @@ int main(int argc, char ** argv) {
3937
{
4038
const int64_t t_start_us = ggml_time_us();
4139

42-
if (llama_model_quantize(fname_inp.c_str(), fname_out.c_str(), itype, QK)) {
40+
if (llama_model_quantize(fname_inp.c_str(), fname_out.c_str(), itype)) {
4341
fprintf(stderr, "%s: failed to quantize model from '%s'\n", __func__, fname_inp.c_str());
4442
return 1;
4543
}

0 commit comments

Comments
 (0)