Spaces:
Paused
Paused
Commit
·
63b9057
1
Parent(s):
526ff2e
Fixed req file
Browse files
- .gitignore +14 -27
- main/logs/llm_api.log +19 -0
- requirements.txt +19 -27
.gitignore
CHANGED
@@ -1,14 +1,7 @@
|
|
1 |
-
# Environment files
|
2 |
-
.env
|
3 |
-
.env.*
|
4 |
-
|
5 |
# Virtual environment
|
6 |
myenv/
|
7 |
venv/
|
8 |
-
|
9 |
-
|
10 |
-
# Model checkpoints
|
11 |
-
checkpoints/
|
12 |
|
13 |
# Python
|
14 |
__pycache__/
|
@@ -16,30 +9,24 @@ __pycache__/
|
|
16 |
*$py.class
|
17 |
*.so
|
18 |
.Python
|
19 |
-
|
20 |
-
|
21 |
dist/
|
22 |
-
|
23 |
eggs/
|
24 |
-
.eggs/
|
25 |
-
lib/
|
26 |
-
lib64/
|
27 |
-
parts/
|
28 |
-
sdist/
|
29 |
-
var/
|
30 |
-
wheels/
|
31 |
*.egg-info/
|
32 |
-
.
|
33 |
-
|
|
|
|
|
|
|
34 |
|
35 |
# IDE
|
36 |
-
.idea/
|
37 |
.vscode/
|
|
|
38 |
*.swp
|
39 |
-
|
40 |
-
.DS_Store
|
41 |
|
42 |
-
#
|
43 |
-
|
44 |
-
|
45 |
-
.cache/
|
|
|
|
|
|
|
|
|
|
|
1 |
# Virtual environment
|
2 |
myenv/
|
3 |
venv/
|
4 |
+
env/
|
|
|
|
|
|
|
5 |
|
6 |
# Python
|
7 |
__pycache__/
|
|
|
9 |
*$py.class
|
10 |
*.so
|
11 |
.Python
|
12 |
+
*.egg
|
13 |
+
*.egg-info/
|
14 |
dist/
|
15 |
+
build/
|
16 |
eggs/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
17 |
*.egg-info/
|
18 |
+
.eggs/
|
19 |
+
|
20 |
+
# Models
|
21 |
+
models/
|
22 |
+
main/models/
|
23 |
|
24 |
# IDE
|
|
|
25 |
.vscode/
|
26 |
+
.idea/
|
27 |
*.swp
|
28 |
+
*~
|
|
|
29 |
|
30 |
+
# OS
|
31 |
+
.DS_Store
|
32 |
+
Thumbs.db
|
|
main/logs/llm_api.log
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
2025-01-09 15:54:08,215 - hf_validation - WARNING - No .env file found. Fine if you're on Huggingface, but you need one to run locally on your PC.
|
2 |
+
2025-01-09 15:54:08,215 - hf_validation - ERROR - No HF_TOKEN found in environment variables
|
3 |
+
2025-01-09 15:54:08,215 - main - INFO - Starting LLM API server
|
4 |
+
2025-01-09 15:54:08,216 - llm_api - INFO - Initializing LLM API
|
5 |
+
2025-01-09 15:54:08,216 - llm_api - INFO - LLM API initialized successfully
|
6 |
+
2025-01-09 15:54:08,216 - api_routes - INFO - Router initialized with LLM API instance
|
7 |
+
2025-01-09 15:54:08,218 - main - INFO - FastAPI application created successfully
|
8 |
+
2025-01-09 16:46:10,118 - api_routes - INFO - Received request to download model: microsoft/phi-4
|
9 |
+
2025-01-09 16:46:10,118 - llm_api - INFO - Starting download of model: microsoft/phi-4
|
10 |
+
2025-01-09 16:46:10,118 - llm_api - INFO - Enabling stdout logging for download
|
11 |
+
2025-01-09 17:00:32,400 - llm_api - INFO - Disabling stdout logging
|
12 |
+
2025-01-09 17:00:32,400 - llm_api - INFO - Saving model to main/models/phi-4
|
13 |
+
2025-01-09 17:02:39,928 - llm_api - INFO - Successfully downloaded model: microsoft/phi-4
|
14 |
+
2025-01-09 17:02:41,075 - api_routes - INFO - Successfully downloaded model: microsoft/phi-4
|
15 |
+
2025-01-09 17:02:41,080 - api_routes - INFO - Received request to initialize model: huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated
|
16 |
+
2025-01-09 17:02:41,080 - llm_api - INFO - Initializing generation model: huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated
|
17 |
+
2025-01-09 17:02:41,081 - llm_api - INFO - Loading model from source: huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated
|
18 |
+
2025-01-09 17:02:41,377 - llm_api - ERROR - Failed to initialize generation model huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated: Using `low_cpu_mem_usage=True` or a `device_map` requires Accelerate: `pip install 'accelerate>=0.26.0'`
|
19 |
+
2025-01-09 17:02:41,377 - api_routes - ERROR - Error initializing model: Using `low_cpu_mem_usage=True` or a `device_map` requires Accelerate: `pip install 'accelerate>=0.26.0'`
|
requirements.txt
CHANGED
@@ -1,22 +1,20 @@
|
|
1 |
-
accelerate==1.
|
2 |
annotated-types==0.7.0
|
3 |
-
anyio==4.
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
fastapi==0.115.5
|
9 |
filelock==3.16.1
|
10 |
-
fsspec==2024.
|
11 |
h11==0.14.0
|
12 |
-
huggingface-hub==0.
|
13 |
idna==3.10
|
14 |
-
|
15 |
-
Jinja2==3.1.4
|
16 |
MarkupSafe==3.0.2
|
17 |
mpmath==1.3.0
|
18 |
networkx==3.4.2
|
19 |
-
numpy==2.1
|
20 |
nvidia-cublas-cu12==12.4.5.8
|
21 |
nvidia-cuda-cupti-cu12==12.4.127
|
22 |
nvidia-cuda-nvrtc-cu12==12.4.127
|
@@ -30,28 +28,22 @@ nvidia-nccl-cu12==2.21.5
|
|
30 |
nvidia-nvjitlink-cu12==12.4.127
|
31 |
nvidia-nvtx-cu12==12.4.127
|
32 |
packaging==24.2
|
33 |
-
|
34 |
-
|
35 |
-
|
36 |
-
pydantic==2.10.2
|
37 |
-
pydantic_core==2.27.1
|
38 |
python-dotenv==1.0.1
|
39 |
PyYAML==6.0.2
|
40 |
regex==2024.11.6
|
41 |
requests==2.32.3
|
42 |
-
|
43 |
-
|
44 |
-
setuptools==75.6.0
|
45 |
sniffio==1.3.1
|
46 |
starlette==0.41.3
|
47 |
sympy==1.13.1
|
48 |
-
tokenizers==0.
|
49 |
torch==2.5.1
|
50 |
tqdm==4.67.1
|
51 |
-
transformers==4.
|
52 |
-
triton==3.1.0
|
53 |
typing_extensions==4.12.2
|
54 |
-
urllib3==2.
|
55 |
-
|
56 |
-
uvicorn==0.32.1
|
57 |
-
wcwidth==0.2.13
|
|
|
1 |
+
accelerate==1.2.1
|
2 |
annotated-types==0.7.0
|
3 |
+
anyio==4.8.0
|
4 |
+
certifi==2024.12.14
|
5 |
+
charset-normalizer==3.4.1
|
6 |
+
click==8.1.8
|
7 |
+
fastapi==0.115.6
|
|
|
8 |
filelock==3.16.1
|
9 |
+
fsspec==2024.12.0
|
10 |
h11==0.14.0
|
11 |
+
huggingface-hub==0.27.1
|
12 |
idna==3.10
|
13 |
+
Jinja2==3.1.5
|
|
|
14 |
MarkupSafe==3.0.2
|
15 |
mpmath==1.3.0
|
16 |
networkx==3.4.2
|
17 |
+
numpy==2.2.1
|
18 |
nvidia-cublas-cu12==12.4.5.8
|
19 |
nvidia-cuda-cupti-cu12==12.4.127
|
20 |
nvidia-cuda-nvrtc-cu12==12.4.127
|
|
|
28 |
nvidia-nvjitlink-cu12==12.4.127
|
29 |
nvidia-nvtx-cu12==12.4.127
|
30 |
packaging==24.2
|
31 |
+
psutil==6.1.1
|
32 |
+
pydantic==2.10.5
|
33 |
+
pydantic_core==2.27.2
|
|
|
|
|
34 |
python-dotenv==1.0.1
|
35 |
PyYAML==6.0.2
|
36 |
regex==2024.11.6
|
37 |
requests==2.32.3
|
38 |
+
safetensors==0.5.2
|
39 |
+
setuptools==75.8.0
|
|
|
40 |
sniffio==1.3.1
|
41 |
starlette==0.41.3
|
42 |
sympy==1.13.1
|
43 |
+
tokenizers==0.21.0
|
44 |
torch==2.5.1
|
45 |
tqdm==4.67.1
|
46 |
+
transformers==4.47.1
|
|
|
47 |
typing_extensions==4.12.2
|
48 |
+
urllib3==2.3.0
|
49 |
+
uvicorn==0.34.0
|
|
|
|