Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -17,7 +17,7 @@ llm = Llama(
|
|
17 |
model_path=base_model_path,
|
18 |
lora_path=adapter_path,
|
19 |
n_ctx=256, # Reduced context length (adjust based on your needs)
|
20 |
-
n_threads=
|
21 |
n_gpu_layers=0, # 0 keeps every layer on the CPU; raise it to offload layers to the GPU (adjust based on VRAM)
|
22 |
use_mmap=False, # Disable memory mapping for faster access
|
23 |
use_mlock=True, # Lock model in memory for stability
|
|
|
17 |
model_path=base_model_path,
|
18 |
lora_path=adapter_path,
|
19 |
n_ctx=256, # Reduced context length (adjust based on your needs)
|
20 |
+
n_threads=2, # Use 2 CPU threads (adjust to the number of cores available on your system)
|
21 |
n_gpu_layers=0, # 0 keeps every layer on the CPU; raise it to offload layers to the GPU (adjust based on VRAM)
|
22 |
use_mmap=False, # Disable memory mapping for faster access
|
23 |
use_mlock=True, # Lock model in memory for stability
|