Spaces:
Sleeping
Sleeping
Commit ·
6301fdd
1
Parent(s): 206fb58
Adding the openBLAS
Browse files
- gguf_engine.py +2 -0
- packages.txt +1 -0
gguf_engine.py
CHANGED
|
@@ -92,6 +92,7 @@ def _load_text_model(adapter_name: str) -> Llama:
|
|
| 92 |
n_ctx = N_CTX,
|
| 93 |
n_batch = N_BATCH,
|
| 94 |
n_threads = N_THREADS,
|
|
|
|
| 95 |
use_mmap = True,
|
| 96 |
verbose = False,
|
| 97 |
)
|
|
@@ -125,6 +126,7 @@ def _load_vision_model(vision_module: str) -> Llama:
|
|
| 125 |
n_ctx = 1024,
|
| 126 |
n_batch = N_BATCH,
|
| 127 |
n_threads = N_THREADS,
|
|
|
|
| 128 |
use_mmap = True,
|
| 129 |
verbose = False,
|
| 130 |
)
|
|
|
|
| 92 |
n_ctx = N_CTX,
|
| 93 |
n_batch = N_BATCH,
|
| 94 |
n_threads = N_THREADS,
|
| 95 |
+
n_threads_batch=2, # Crucial for OpenBLAS prompt evaluation
|
| 96 |
use_mmap = True,
|
| 97 |
verbose = False,
|
| 98 |
)
|
|
|
|
| 126 |
n_ctx = 1024,
|
| 127 |
n_batch = N_BATCH,
|
| 128 |
n_threads = N_THREADS,
|
| 129 |
+
n_threads_batch=2, # Crucial for OpenBLAS prompt evaluation
|
| 130 |
use_mmap = True,
|
| 131 |
verbose = False,
|
| 132 |
)
|
packages.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
libopenblas0-pthread
|