AurelioAguirre committed on
Commit
63b9057
·
1 Parent(s): 526ff2e

Fixed req file

Browse files
Files changed (3) hide show
  1. .gitignore +14 -27
  2. main/logs/llm_api.log +19 -0
  3. requirements.txt +19 -27
.gitignore CHANGED
@@ -1,14 +1,7 @@
1
- ># Environment files
2
- .env
3
- .env.*
4
-
5
  # Virtual environment
6
  myenv/
7
  venv/
8
- ENV/
9
-
10
- # Model checkpoints
11
- checkpoints/
12
 
13
  # Python
14
  __pycache__/
@@ -16,30 +9,24 @@ __pycache__/
16
  *$py.class
17
  *.so
18
  .Python
19
- build/
20
- develop-eggs/
21
  dist/
22
- downloads/
23
  eggs/
24
- .eggs/
25
- lib/
26
- lib64/
27
- parts/
28
- sdist/
29
- var/
30
- wheels/
31
  *.egg-info/
32
- .installed.cfg
33
- *.egg
 
 
 
34
 
35
  # IDE
36
- .idea/
37
  .vscode/
 
38
  *.swp
39
- *.swo
40
- .DS_Store
41
 
42
- # Logs
43
- *.log
44
- logs/
45
- .cache/
 
 
 
 
 
1
  # Virtual environment
2
  myenv/
3
  venv/
4
+ env/
 
 
 
5
 
6
  # Python
7
  __pycache__/
 
9
  *$py.class
10
  *.so
11
  .Python
12
+ *.egg
13
+ *.egg-info/
14
  dist/
15
+ build/
16
  eggs/
 
 
 
 
 
 
 
17
  *.egg-info/
18
+ .eggs/
19
+
20
+ # Models
21
+ models/
22
+ main/models/
23
 
24
  # IDE
 
25
  .vscode/
26
+ .idea/
27
  *.swp
28
+ *~
 
29
 
30
+ # OS
31
+ .DS_Store
32
+ Thumbs.db
 
main/logs/llm_api.log ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-01-09 15:54:08,215 - hf_validation - WARNING - No .env file found. Fine if you're on Huggingface, but you need one to run locally on your PC.
2
+ 2025-01-09 15:54:08,215 - hf_validation - ERROR - No HF_TOKEN found in environment variables
3
+ 2025-01-09 15:54:08,215 - main - INFO - Starting LLM API server
4
+ 2025-01-09 15:54:08,216 - llm_api - INFO - Initializing LLM API
5
+ 2025-01-09 15:54:08,216 - llm_api - INFO - LLM API initialized successfully
6
+ 2025-01-09 15:54:08,216 - api_routes - INFO - Router initialized with LLM API instance
7
+ 2025-01-09 15:54:08,218 - main - INFO - FastAPI application created successfully
8
+ 2025-01-09 16:46:10,118 - api_routes - INFO - Received request to download model: microsoft/phi-4
9
+ 2025-01-09 16:46:10,118 - llm_api - INFO - Starting download of model: microsoft/phi-4
10
+ 2025-01-09 16:46:10,118 - llm_api - INFO - Enabling stdout logging for download
11
+ 2025-01-09 17:00:32,400 - llm_api - INFO - Disabling stdout logging
12
+ 2025-01-09 17:00:32,400 - llm_api - INFO - Saving model to main/models/phi-4
13
+ 2025-01-09 17:02:39,928 - llm_api - INFO - Successfully downloaded model: microsoft/phi-4
14
+ 2025-01-09 17:02:41,075 - api_routes - INFO - Successfully downloaded model: microsoft/phi-4
15
+ 2025-01-09 17:02:41,080 - api_routes - INFO - Received request to initialize model: huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated
16
+ 2025-01-09 17:02:41,080 - llm_api - INFO - Initializing generation model: huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated
17
+ 2025-01-09 17:02:41,081 - llm_api - INFO - Loading model from source: huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated
18
+ 2025-01-09 17:02:41,377 - llm_api - ERROR - Failed to initialize generation model huihui-ai/Qwen2.5-Coder-32B-Instruct-abliterated: Using `low_cpu_mem_usage=True` or a `device_map` requires Accelerate: `pip install 'accelerate>=0.26.0'`
19
+ 2025-01-09 17:02:41,377 - api_routes - ERROR - Error initializing model: Using `low_cpu_mem_usage=True` or a `device_map` requires Accelerate: `pip install 'accelerate>=0.26.0'`
requirements.txt CHANGED
@@ -1,22 +1,20 @@
1
- accelerate==1.1.1
2
  annotated-types==0.7.0
3
- anyio==4.6.2.post1
4
- bitsandbytes==0.45.0
5
- certifi==2024.8.30
6
- charset-normalizer==3.4.0
7
- click==8.1.7
8
- fastapi==0.115.5
9
  filelock==3.16.1
10
- fsspec==2024.10.0
11
  h11==0.14.0
12
- huggingface-hub==0.26.3
13
  idna==3.10
14
- inquirerpy==0.3.4
15
- Jinja2==3.1.4
16
  MarkupSafe==3.0.2
17
  mpmath==1.3.0
18
  networkx==3.4.2
19
- numpy==2.1.3
20
  nvidia-cublas-cu12==12.4.5.8
21
  nvidia-cuda-cupti-cu12==12.4.127
22
  nvidia-cuda-nvrtc-cu12==12.4.127
@@ -30,28 +28,22 @@ nvidia-nccl-cu12==2.21.5
30
  nvidia-nvjitlink-cu12==12.4.127
31
  nvidia-nvtx-cu12==12.4.127
32
  packaging==24.2
33
- pfzy==0.3.4
34
- prompt_toolkit==3.0.48
35
- psutil==6.1.0
36
- pydantic==2.10.2
37
- pydantic_core==2.27.1
38
  python-dotenv==1.0.1
39
  PyYAML==6.0.2
40
  regex==2024.11.6
41
  requests==2.32.3
42
- router==0.1
43
- safetensors==0.4.5
44
- setuptools==75.6.0
45
  sniffio==1.3.1
46
  starlette==0.41.3
47
  sympy==1.13.1
48
- tokenizers==0.20.3
49
  torch==2.5.1
50
  tqdm==4.67.1
51
- transformers==4.46.3
52
- triton==3.1.0
53
  typing_extensions==4.12.2
54
- urllib3==2.2.3
55
- utils==1.0.2
56
- uvicorn==0.32.1
57
- wcwidth==0.2.13
 
1
+ accelerate==1.2.1
2
  annotated-types==0.7.0
3
+ anyio==4.8.0
4
+ certifi==2024.12.14
5
+ charset-normalizer==3.4.1
6
+ click==8.1.8
7
+ fastapi==0.115.6
 
8
  filelock==3.16.1
9
+ fsspec==2024.12.0
10
  h11==0.14.0
11
+ huggingface-hub==0.27.1
12
  idna==3.10
13
+ Jinja2==3.1.5
 
14
  MarkupSafe==3.0.2
15
  mpmath==1.3.0
16
  networkx==3.4.2
17
+ numpy==2.2.1
18
  nvidia-cublas-cu12==12.4.5.8
19
  nvidia-cuda-cupti-cu12==12.4.127
20
  nvidia-cuda-nvrtc-cu12==12.4.127
 
28
  nvidia-nvjitlink-cu12==12.4.127
29
  nvidia-nvtx-cu12==12.4.127
30
  packaging==24.2
31
+ psutil==6.1.1
32
+ pydantic==2.10.5
33
+ pydantic_core==2.27.2
 
 
34
  python-dotenv==1.0.1
35
  PyYAML==6.0.2
36
  regex==2024.11.6
37
  requests==2.32.3
38
+ safetensors==0.5.2
39
+ setuptools==75.8.0
 
40
  sniffio==1.3.1
41
  starlette==0.41.3
42
  sympy==1.13.1
43
+ tokenizers==0.21.0
44
  torch==2.5.1
45
  tqdm==4.67.1
46
+ transformers==4.47.1
 
47
  typing_extensions==4.12.2
48
+ urllib3==2.3.0
49
+ uvicorn==0.34.0