Tobias Bergmann committed on
Commit
80236d4
·
1 Parent(s): 60c26de

new server + thread settings

Browse files
Files changed (2) hide show
  1. app.py +2 -1
  2. llama-server +2 -2
app.py CHANGED
@@ -10,6 +10,7 @@ import requests
10
  import json
11
  import subprocess
12
  import gradio as gr
 
13
 
14
  today_date = datetime.today().strftime("%B %-d, %Y") # noqa: DTZ002
15
 
@@ -38,7 +39,7 @@ gguf_path = hf_hub_download(
38
 
39
  # start llama-server
40
  subprocess.run(["chmod", "+x", "llama-server"])
41
- command = ["./llama-server", "-m", "google_gemma-3-1b-it-IQ4_NL.gguf", "-ngl", "0", "--temp", "0.0", "-c", "2048", "-t", "8", "--port", "8081"]
42
  process = subprocess.Popen(command)
43
  print(f"Llama-server process started with PID {process.pid}")
44
 
 
10
  import json
11
  import subprocess
12
  import gradio as gr
13
+ import os
14
 
15
  today_date = datetime.today().strftime("%B %-d, %Y") # noqa: DTZ002
16
 
 
39
 
40
  # start llama-server
41
  subprocess.run(["chmod", "+x", "llama-server"])
42
+ command = ["./llama-server", "-m", "google_gemma-3-1b-it-IQ4_NL.gguf", "-ngl", "0", "--temp", "0.0", "-c", "2048", "-t", str(os.cpu_count()), "--port", "8081"]
43
  process = subprocess.Popen(command)
44
  print(f"Llama-server process started with PID {process.pid}")
45
 
llama-server CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ead85d6cb439c1f7abfcd987bd19e125471e0350e9035f2edbc2ec25af1014d
3
- size 6362744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8bb9756aaf882b0ee1d7da03347e58a9aa846ac4defde5d122633837c077749
3
+ size 6358592