QJMKWB committed on
Commit
26bc55c
·
verified ·
1 Parent(s): 1dfc44a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -56
app.py CHANGED
@@ -1,68 +1,26 @@
1
  import os
2
  import subprocess
3
- import sys
4
 
5
- def install_dependencies():
6
- print("--- INŠTALÁCIA ZÁVISLOSTÍ (toto môže chvíľu trvať) ---")
7
- # Nastavenie pre kompiláciu llama-cpp
8
- os.environ["CMAKE_ARGS"] = "-DLLAMA_NATIVE=OFF"
9
-
10
- packages = [
11
- "huggingface_hub[hf-transfer]",
12
- "llama-cpp-python[server]"
13
- ]
14
-
15
- for package in packages:
16
- print(f"Inštalujem {package}...")
17
- subprocess.check_call([sys.executable, "-m", "pip", "install", "--no-cache-dir", package])
18
-
19
- print("--- INŠTALÁCIA DOKONČENÁ ---")
20
 
21
- def download_model():
22
- # Aktivujeme hf_transfer pre super rýchle sťahovanie
23
- os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
24
- from huggingface_hub import hf_hub_download
25
-
26
- repo_id = "bartowski/Qwen2.5-Coder-7B-Instruct-GGUF"
27
- filename = "Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf"
28
-
29
- print(f"--- SŤAHUJEM MODEL: {filename} ---")
30
-
31
- # Stiahne model priamo do aktuálneho adresára
32
  model_path = hf_hub_download(
33
- repo_id=repo_id,
34
- filename=filename,
35
- local_dir=".",
36
- local_dir_use_symlinks=False
37
  )
38
- print(f"--- MODEL PRIPRAVENÝ: {model_path} ---")
39
- return filename
40
 
41
- def run_server(model_file):
42
- print("--- SPÚŠŤAM SERVER ---")
43
- command = [
44
- sys.executable, "-m", "llama_cpp.server",
45
- "--model", model_file,
46
  "--host", "0.0.0.0",
47
  "--port", "7860",
48
- "--chat_format", "chatml",
49
  "--n_ctx", "4096"
50
- ]
51
-
52
- # Spustenie servera tak, aby logy tiekli priamo do konzoly HF Spaces
53
- subprocess.run(command)
54
 
55
  if __name__ == "__main__":
56
- try:
57
- # 1. Inštalácia (ak už sú, pip ich preskočí)
58
- install_dependencies()
59
-
60
- # 2. Sťahovanie
61
- model_filename = download_model()
62
-
63
- # 3. Štart
64
- run_server(model_filename)
65
-
66
- except Exception as e:
67
- print(f"KRITICKÁ CHYBA: {e}")
68
- sys.exit(1)
 
1
  import os
2
  import subprocess
3
+ from huggingface_hub import hf_hub_download
4
 
5
+ # Rýchle sťahovanie
6
+ os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
 
 
 
 
 
 
 
 
 
 
 
 
 
7
 
8
+ def run():
9
+ # Stiahneš model (už máš llama-cpp pripravené v systéme)
 
 
 
 
 
 
 
 
 
10
  model_path = hf_hub_download(
11
+ repo_id="bartowski/Qwen2.5-Coder-7B-Instruct-GGUF",
12
+ filename="Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf",
13
+ local_dir="."
 
14
  )
 
 
15
 
16
+ # Spustíš server
17
+ subprocess.run([
18
+ "python3", "-m", "llama_cpp.server",
19
+ "--model", "Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf",
 
20
  "--host", "0.0.0.0",
21
  "--port", "7860",
 
22
  "--n_ctx", "4096"
23
+ ])
 
 
 
24
 
25
  if __name__ == "__main__":
26
+ run()