TruVlad committed on
Commit
22a58da
·
verified ·
1 Parent(s): c97a86f

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. Dockerfile +1 -0
  2. main.py +7 -36
  3. pull4.sh +16 -0
  4. pull8.sh +2 -2
  5. util.py +9 -8
Dockerfile CHANGED
@@ -35,6 +35,7 @@ COPY pull14.sh pull14.sh
35
 
36
  RUN pip install --no-cache-dir -r requirements.txt --break-system-packages
37
 
 
38
  COPY main.py main.py
39
  COPY util.py util.py
40
  COPY start.sh start.sh
 
35
 
36
  RUN pip install --no-cache-dir -r requirements.txt --break-system-packages
37
 
38
+ VOLUME vol1 vol2
39
  COPY main.py main.py
40
  COPY util.py util.py
41
  COPY start.sh start.sh
main.py CHANGED
@@ -17,7 +17,7 @@ def test_world():
17
  ansver = []
18
  for model in response.models:
19
  ansver.append(f'Name:{model.model}')
20
- ansver.append(f' Size (MB): {(model.size.real / 1024 / 1024):.2f}')
21
  if model.details:
22
  ansver.append(f' Format: {model.details.format}')
23
  ansver.append(f' Family: {model.details.family}')
@@ -42,52 +42,23 @@ def ps():
42
  ansver.append(f' Details: {model.details}')
43
  ansver.append(f' Context length: {model.context_length}')
44
  ansver.append(f'\n')
45
-
46
- response: ListResponse = ollist()
47
- for model in response.models:
48
- ansver.append(f'Name:{model.model}')
49
- ansver.append(f' Size (MB): {(model.size.real / 1024 / 1024):.2f}')
50
- if model.details:
51
- ansver.append(f' Format: {model.details.format}')
52
- ansver.append(f' Family: {model.details.family}')
53
- ansver.append(f' Parameter Size: {model.details.parameter_size}')
54
- ansver.append(f' Quantization Level:{model.details.quantization_level}')
55
  result = [f'<p>{answ}</p>' for answ in ansver ]
56
  return '\n'.join(result)
57
 
58
  @app.route('/time')
59
  def test_time():
60
- from datetime import datetime
61
- from ollama import Client
62
- from ollama import chat
63
-
64
- t_start=datetime.now()
65
- ansver = []
66
- messages = [
67
- {
68
- 'role': 'user',
69
- 'content': 'Расскажи о себе подробно',
70
- },
71
- ]
72
- response = chat('qwen3:0.6b', messages=messages)
73
- ansver.append(f' start {t_start} ')
74
- response_time=datetime.now()-t_start
75
- ansver.append(f' duration {response_time} ')
76
- #
77
- response_len = len(response['message']['content'])
78
- ansver.append(f" lehgth {response_len}")
79
- response_speed=response_len/int(response_time.seconds)
80
- ansver.append(f" token/sek {response_len}")
81
- ansver.append(response['message']['content'])
82
- result = [f'<p>{answ}</p>' for answ in ansver ]
83
- return '\n'.join(result)
84
 
85
 
 
 
 
 
86
  @app.route('/time8')
87
  def test_time8():
88
  return time_model('qwen3:8b')
89
 
90
- #@app.route('/time14')
91
  def test_time14():
92
  return time_model('qwen3:14b')
93
 
 
17
  ansver = []
18
  for model in response.models:
19
  ansver.append(f'Name:{model.model}')
20
+ ansver.append(f'\t Size (MB): {(model.size.real / 1024 / 1024):.2f}')
21
  if model.details:
22
  ansver.append(f' Format: {model.details.format}')
23
  ansver.append(f' Family: {model.details.family}')
 
42
  ansver.append(f' Details: {model.details}')
43
  ansver.append(f' Context length: {model.context_length}')
44
  ansver.append(f'\n')
 
 
 
 
 
 
 
 
 
 
45
  result = [f'<p>{answ}</p>' for answ in ansver ]
46
  return '\n'.join(result)
47
 
48
  @app.route('/time')
49
  def test_time():
50
+ return time_model('qwen3:0.6b')
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
 
52
 
53
+ @app.route('/tim4')
54
+ def test_time8():
55
+ return time_model('qwen3:4b')
56
+
57
  @app.route('/time8')
58
  def test_time8():
59
  return time_model('qwen3:8b')
60
 
61
+ @app.route('/time14')
62
  def test_time14():
63
  return time_model('qwen3:14b')
64
 
pull4.sh ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #/bin/bash
2
+ while true
3
+ do nohup ollama serve >/dev/null 2>&1
4
+ echo sleep 9
5
+ sleep 9
6
+ done >/dev/null 2>&1 &
7
+ echo sleep 5
8
+ sleep 5
9
+ # /usr/bin/ollama pull qwen3-next:80b
10
+ # /usr/bin/ollama pull qwen3-vl:235b
11
+ # /usr/bin/ollama pull qwen3:0.6b
12
+ /usr/bin/ollama pull qwen3:4b
13
+ # /usr/bin/ollama pull qwen3:14b
14
+ # /usr/bin/ollama pull qwen3:30b
15
+ # /usr/bin/ollama pull qwen3.5:35b
16
+ /usr/bin/ollama list
pull8.sh CHANGED
@@ -8,8 +8,8 @@ echo sleep 5
8
  sleep 5
9
  # /usr/bin/ollama pull qwen3-next:80b
10
  # /usr/bin/ollama pull qwen3-vl:235b
11
- /usr/bin/ollama pull qwen3:0.6b
12
- # /usr/bin/ollama pull qwen3:8b
13
  # /usr/bin/ollama pull qwen3:14b
14
  # /usr/bin/ollama pull qwen3:30b
15
  # /usr/bin/ollama pull qwen3.5:35b
 
8
  sleep 5
9
  # /usr/bin/ollama pull qwen3-next:80b
10
  # /usr/bin/ollama pull qwen3-vl:235b
11
+ # /usr/bin/ollama pull qwen3:0.6b
12
+ /usr/bin/ollama pull qwen3:8b
13
  # /usr/bin/ollama pull qwen3:14b
14
  # /usr/bin/ollama pull qwen3:30b
15
  # /usr/bin/ollama pull qwen3.5:35b
util.py CHANGED
@@ -9,12 +9,12 @@ def ps():
9
  response: ProcessResponse = ps()
10
  for model in response.models:
11
  ansver.append(f'Model: {model.model}')
12
- ansver.append(f' Digest: {model.digest}')
13
- ansver.append(f' Expires at: {model.expires_at}')
14
- ansver.append(f' Size: {model.size}')
15
- ansver.append(f' Size vram: {model.size_vram}')
16
- ansver.append(f' Details: {model.details}')
17
- ansver.append(f' Context length: {model.context_length}')
18
  ansver.append(f'\n')
19
  result = [f'<p>{answ}</p>' for answ in ansver ]
20
  return '\n'.join(result)
@@ -33,14 +33,15 @@ def time_model(model_name='qwen3:0.6b'):
33
  },
34
  ]
35
  response = chat(model_name, messages=messages)
 
36
  ansver.append(f' start {t_start} ')
37
  response_time=datetime.now()-t_start
38
  ansver.append(f' duration {response_time} ')
39
  #
40
  response_len = len(response['message']['content'])
41
- ansver.append(f" lehgth {response_len}")
42
  response_speed=response_len/int(response_time.seconds)
43
- ansver.append(f" token/sek {response_len}")
44
  ansver.append(response['message']['content'])
45
  result = [f'<p>{answ}</p>' for answ in ansver ]
46
  return '\n'.join(result)
 
9
  response: ProcessResponse = ps()
10
  for model in response.models:
11
  ansver.append(f'Model: {model.model}')
12
+ ansver.append(f'\t Digest: {model.digest}')
13
+ ansver.append(f'\t Expires at: {model.expires_at}')
14
+ ansver.append(f'\t Size: {model.size}')
15
+ ansver.append(f'\t Size vram: {model.size_vram}')
16
+ ansver.append(f'\t Details: {model.details}')
17
+ ansver.append(f'\t Context length: {model.context_length}')
18
  ansver.append(f'\n')
19
  result = [f'<p>{answ}</p>' for answ in ansver ]
20
  return '\n'.join(result)
 
33
  },
34
  ]
35
  response = chat(model_name, messages=messages)
36
+ ansver.append(f' <h3> {model_name}</h3>')
37
  ansver.append(f' start {t_start} ')
38
  response_time=datetime.now()-t_start
39
  ansver.append(f' duration {response_time} ')
40
  #
41
  response_len = len(response['message']['content'])
42
+ ansver.append(f' lehgth {response_len}')
43
  response_speed=response_len/int(response_time.seconds)
44
+ ansver.append(f' token/sek {response_len}')
45
  ansver.append(response['message']['content'])
46
  result = [f'<p>{answ}</p>' for answ in ansver ]
47
  return '\n'.join(result)