TruVlad committed on
Commit
bcaf6d9
·
verified ·
1 Parent(s): 9088a98

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. Dockerfile +2 -0
  2. main.py +7 -9
  3. start.sh +1 -0
  4. util.py +2 -2
Dockerfile CHANGED
@@ -28,6 +28,8 @@ RUN apt-get install git g++ python3 python3-pip -y && apt-get clean
28
  COPY requirements.txt requirements.txt
29
  COPY pull06.sh pull06.sh
30
  RUN /bin/bash -x pull06.sh
 
 
31
  COPY pull8.sh pull8.sh
32
  # RUN /bin/bash -x pull8.sh
33
  COPY pull14.sh pull14.sh
 
28
  COPY requirements.txt requirements.txt
29
  COPY pull06.sh pull06.sh
30
  RUN /bin/bash -x pull06.sh
31
+
32
+ COPY pull4.sh pull4.sh
33
  COPY pull8.sh pull8.sh
34
  # RUN /bin/bash -x pull8.sh
35
  COPY pull14.sh pull14.sh
main.py CHANGED
@@ -16,13 +16,13 @@ def test_world():
16
  response: ListResponse = ollist()
17
  ansver = []
18
  for model in response.models:
19
- ansver.append(f'Name:{model.model}')
20
  ansver.append(f'\t Size (MB): {(model.size.real / 1024 / 1024):.2f}')
21
  if model.details:
22
- ansver.append(f' Format: {model.details.format}')
23
- ansver.append(f' Family: {model.details.family}')
24
- ansver.append(f' Parameter Size: {model.details.parameter_size}')
25
- ansver.append(f' Quantization Level:{model.details.quantization_level}')
26
  result = [f'<p>{answ}</p>' for answ in ansver ]
27
  return '\n'.join(result)
28
 
@@ -31,10 +31,9 @@ def test_world():
31
  def ps():
32
  from ollama import ProcessResponse, chat, ps, pull
33
  ansver = []
34
-
35
  response: ProcessResponse = ps()
36
  for model in response.models:
37
- ansver.append(f'Model: {model.model}')
38
  ansver.append(f' Digest: {model.digest}')
39
  ansver.append(f' Expires at: {model.expires_at}')
40
  ansver.append(f' Size: {model.size}')
@@ -49,8 +48,7 @@ def ps():
49
  def test_time():
50
  return time_model('qwen3:0.6b')
51
 
52
-
53
- @app.route('/tim4')
54
  def test_time4():
55
  return time_model('qwen3:4b')
56
 
 
16
  response: ListResponse = ollist()
17
  ansver = []
18
  for model in response.models:
19
+ ansver.append(f'<h4>Name:{model.model}</h4>')
20
  ansver.append(f'\t Size (MB): {(model.size.real / 1024 / 1024):.2f}')
21
  if model.details:
22
+ ansver.append(f'\t Format: {model.details.format}')
23
+ ansver.append(f'\t Family: {model.details.family}')
24
+ ansver.append(f'\t Parameter Size: {model.details.parameter_size}')
25
+ ansver.append(f'\t Quantization Level:{model.details.quantization_level}')
26
  result = [f'<p>{answ}</p>' for answ in ansver ]
27
  return '\n'.join(result)
28
 
 
31
  def ps():
32
  from ollama import ProcessResponse, chat, ps, pull
33
  ansver = []
 
34
  response: ProcessResponse = ps()
35
  for model in response.models:
36
+ ansver.append(f'<h4>Model</h4>: {model.model}')
37
  ansver.append(f' Digest: {model.digest}')
38
  ansver.append(f' Expires at: {model.expires_at}')
39
  ansver.append(f' Size: {model.size}')
 
48
  def test_time():
49
  return time_model('qwen3:0.6b')
50
 
51
+ @app.route('/time4')
 
52
  def test_time4():
53
  return time_model('qwen3:4b')
54
 
start.sh CHANGED
@@ -6,6 +6,7 @@ while true
6
  done >/dev/null 2>&1 &
7
  echo sleep 3
8
  sleep 3
 
9
  /bin/bash pull8.sh
10
  /bin/bash pull14.sh
11
  python3 main.py
 
6
  done >/dev/null 2>&1 &
7
  echo sleep 3
8
  sleep 3
9
+ /bin/bash pull4.sh
10
  /bin/bash pull8.sh
11
  /bin/bash pull14.sh
12
  python3 main.py
util.py CHANGED
@@ -8,7 +8,7 @@ def ps():
8
 
9
  response: ProcessResponse = ps()
10
  for model in response.models:
11
- ansver.append(f'Model: {model.model}')
12
  ansver.append(f'\t Digest: {model.digest}')
13
  ansver.append(f'\t Expires at: {model.expires_at}')
14
  ansver.append(f'\t Size: {model.size}')
@@ -41,7 +41,7 @@ def time_model(model_name='qwen3:0.6b'):
41
  response_len = len(response['message']['content'])
42
  ansver.append(f' lehgth {response_len}')
43
  response_speed=response_len/int(response_time.seconds)
44
- ansver.append(f' token/sek {response_len}')
45
  ansver.append(response['message']['content'])
46
  result = [f'<p>{answ}</p>' for answ in ansver ]
47
  return '\n'.join(result)
 
8
 
9
  response: ProcessResponse = ps()
10
  for model in response.models:
11
+ ansver.append(f'<h3>Mode<h3>: {model.model}')
12
  ansver.append(f'\t Digest: {model.digest}')
13
  ansver.append(f'\t Expires at: {model.expires_at}')
14
  ansver.append(f'\t Size: {model.size}')
 
41
  response_len = len(response['message']['content'])
42
  ansver.append(f' lehgth {response_len}')
43
  response_speed=response_len/int(response_time.seconds)
44
+ ansver.append(f' token/sek {response_speed}')
45
  ansver.append(response['message']['content'])
46
  result = [f'<p>{answ}</p>' for answ in ansver ]
47
  return '\n'.join(result)