johnpaulbin committed on
Commit
5b5db10
·
verified ·
1 Parent(s): e0d55af

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -17,7 +17,7 @@ llm = Llama(
17
  model_path=base_model_path,
18
  lora_path=adapter_path,
19
  n_ctx=256, # Reduced context length (adjust based on your needs)
20
- n_threads=8, # Use all available CPU cores (adjust based on your system)
21
  n_gpu_layers=0, # Enable GPU acceleration (adjust based on VRAM)
22
  use_mmap=False, # Disable memory mapping for faster access
23
  use_mlock=True, # Lock model in memory for stability
 
17
  model_path=base_model_path,
18
  lora_path=adapter_path,
19
  n_ctx=256, # Reduced context length (adjust based on your needs)
20
+ n_threads=2, # Use all available CPU cores (adjust based on your system)
21
  n_gpu_layers=0, # Enable GPU acceleration (adjust based on VRAM)
22
  use_mmap=False, # Disable memory mapping for faster access
23
  use_mlock=True, # Lock model in memory for stability