Spaces:
Running
Running
Tobias Bergmann
committed on
Commit
·
80236d4
1
Parent(s):
60c26de
new server + thread settings
Browse files
- app.py +2 -1
- llama-server +2 -2
app.py
CHANGED
@@ -10,6 +10,7 @@ import requests
|
|
10 |
import json
|
11 |
import subprocess
|
12 |
import gradio as gr
|
|
|
13 |
|
14 |
today_date = datetime.today().strftime("%B %-d, %Y") # noqa: DTZ002
|
15 |
|
@@ -38,7 +39,7 @@ gguf_path = hf_hub_download(
|
|
38 |
|
39 |
# start llama-server
|
40 |
subprocess.run(["chmod", "+x", "llama-server"])
|
41 |
-
command = ["./llama-server", "-m", "google_gemma-3-1b-it-IQ4_NL.gguf", "-ngl", "0", "--temp", "0.0", "-c", "2048", "-t",
|
42 |
process = subprocess.Popen(command)
|
43 |
print(f"Llama-server process started with PID {process.pid}")
|
44 |
|
|
|
10 |
import json
|
11 |
import subprocess
|
12 |
import gradio as gr
|
13 |
+
import os
|
14 |
|
15 |
today_date = datetime.today().strftime("%B %-d, %Y") # noqa: DTZ002
|
16 |
|
|
|
39 |
|
40 |
# start llama-server
|
41 |
subprocess.run(["chmod", "+x", "llama-server"])
|
42 |
+
command = ["./llama-server", "-m", "google_gemma-3-1b-it-IQ4_NL.gguf", "-ngl", "0", "--temp", "0.0", "-c", "2048", "-t", str(os.cpu_count()), "--port", "8081"]
|
43 |
process = subprocess.Popen(command)
|
44 |
print(f"Llama-server process started with PID {process.pid}")
|
45 |
|
llama-server
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8bb9756aaf882b0ee1d7da03347e58a9aa846ac4defde5d122633837c077749
|
3 |
+
size 6358592
|