ggerganov committed on
Commit
648dff8
·
unverified ·
1 Parent(s): 1f461ff

whisper : add memory sizes for Q8_0 (close #846)

Browse files
Files changed (2) hide show
  1. examples/whisper.wasm/README.md +1 -1
  2. whisper.cpp +25 -16
examples/whisper.wasm/README.md CHANGED
@@ -37,6 +37,6 @@ emcmake cmake ..
37
  make -j
38
 
39
  # copy the produced page to your HTTP path
40
- cp bin/whisper.wasm/* /path/to/html/
41
  cp bin/libmain.worker.js /path/to/html/
42
  ```
 
37
  make -j
38
 
39
  # copy the produced page to your HTTP path
40
+ cp bin/whisper.wasm/* /path/to/html/
41
  cp bin/libmain.worker.js /path/to/html/
42
  ```
whisper.cpp CHANGED
@@ -284,11 +284,11 @@ static const std::map<ggml_type, std::map<e_model, size_t>> MEM_REQ_MODEL = {
284
  },
285
  { GGML_TYPE_Q4_1,
286
  {
287
- { MODEL_TINY, 31ull*MB },
288
- { MODEL_BASE, 57ull*MB },
289
- { MODEL_SMALL, 181ull*MB },
290
- { MODEL_MEDIUM, 559ull*MB },
291
- { MODEL_LARGE, 1122ull*MB },
292
  },
293
  },
294
  { GGML_TYPE_Q4_2,
@@ -300,22 +300,31 @@ static const std::map<ggml_type, std::map<e_model, size_t>> MEM_REQ_MODEL = {
300
  { MODEL_LARGE, 940ull*MB },
301
  },
302
  },
303
- { GGML_TYPE_Q5_0, // TODO: fix
304
  {
305
- { MODEL_TINY, 31ull*MB },
306
- { MODEL_BASE, 57ull*MB },
307
- { MODEL_SMALL, 181ull*MB },
308
- { MODEL_MEDIUM, 559ull*MB },
309
- { MODEL_LARGE, 1122ull*MB },
310
  },
311
  },
312
  { GGML_TYPE_Q5_1,
313
  {
314
- { MODEL_TINY, 31ull*MB },
315
- { MODEL_BASE, 57ull*MB },
316
- { MODEL_SMALL, 181ull*MB },
317
- { MODEL_MEDIUM, 559ull*MB },
318
- { MODEL_LARGE, 1122ull*MB },
 
 
 
 
 
 
 
 
 
319
  },
320
  },
321
  };
 
284
  },
285
  { GGML_TYPE_Q4_1,
286
  {
287
+ { MODEL_TINY, 32ull*MB },
288
+ { MODEL_BASE, 58ull*MB },
289
+ { MODEL_SMALL, 182ull*MB },
290
+ { MODEL_MEDIUM, 562ull*MB },
291
+ { MODEL_LARGE, 1124ull*MB },
292
  },
293
  },
294
  { GGML_TYPE_Q4_2,
 
300
  { MODEL_LARGE, 940ull*MB },
301
  },
302
  },
303
+ { GGML_TYPE_Q5_0,
304
  {
305
+ { MODEL_TINY, 30ull*MB },
306
+ { MODEL_BASE, 54ull*MB },
307
+ { MODEL_SMALL, 170ull*MB },
308
+ { MODEL_MEDIUM, 516ull*MB },
309
+ { MODEL_LARGE, 1034ull*MB },
310
  },
311
  },
312
  { GGML_TYPE_Q5_1,
313
  {
314
+ { MODEL_TINY, 32ull*MB },
315
+ { MODEL_BASE, 58ull*MB },
316
+ { MODEL_SMALL, 182ull*MB },
317
+ { MODEL_MEDIUM, 562ull*MB },
318
+ { MODEL_LARGE, 1124ull*MB },
319
+ },
320
+ },
321
+ { GGML_TYPE_Q8_0,
322
+ {
323
+ { MODEL_TINY, 45ull*MB },
324
+ { MODEL_BASE, 84ull*MB },
325
+ { MODEL_SMALL, 268ull*MB },
326
+ { MODEL_MEDIUM, 834ull*MB },
327
+ { MODEL_LARGE, 1674ull*MB },
328
  },
329
  },
330
  };