TruVlad committed on
Commit
440570c
·
verified ·
1 Parent(s): 430f613

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. .util.py.kate-swp +0 -0
  2. Dockerfile +2 -2
  3. main.py +7 -74
  4. start.sh +1 -0
  5. util.py +168 -0
.util.py.kate-swp ADDED
Binary file (2.47 kB). View file
 
Dockerfile CHANGED
@@ -27,8 +27,8 @@ RUN apt-get install git g++ python3 python3-pip -y && apt-get clean
27
 
28
  COPY pull06.sh pull06.sh
29
  RUN /bin/bash -x pull06.sh
30
- COPY pull8.sh pull8.sh
31
- RUN /bin/bash -x pull8.sh
32
  # COPY pull14.sh pull14.sh
33
  # RUN /bin/bash -x pull14.sh
34
 
 
27
 
28
  COPY pull06.sh pull06.sh
29
  RUN /bin/bash -x pull06.sh
30
+ # COPY pull8.sh pull8.sh
31
+ # RUN /bin/bash -x pull8.sh
32
  # COPY pull14.sh pull14.sh
33
  # RUN /bin/bash -x pull14.sh
34
 
main.py CHANGED
@@ -1,5 +1,6 @@
1
  from flask import Flask
2
  import ollama
 
3
 
4
  app = Flask(__name__)
5
 
@@ -10,9 +11,9 @@ def hello_world():
10
 
11
  @app.route('/list')
12
  def test_world():
13
- from ollama import ListResponse, list
14
 
15
- response: ListResponse = list()
16
  ansver = []
17
  for model in response.models:
18
  ansver.append(f'Name:{model.model}')
@@ -42,7 +43,7 @@ def ps():
42
  ansver.append(f' Context length: {model.context_length}')
43
  ansver.append(f'\n')
44
 
45
- response: ListResponse = list()
46
  for model in response.models:
47
  ansver.append(f'Name:{model.model}')
48
  ansver.append(f' Size (MB): {(model.size.real / 1024 / 1024):.2f}')
@@ -84,85 +85,17 @@ def test_time():
84
 
85
  @app.route('/time8')
86
  def test_time8():
87
- from datetime import datetime
88
- from ollama import Client
89
- from ollama import chat
90
-
91
- t_start=datetime.now()
92
- ansver = []
93
- messages = [
94
- {
95
- 'role': 'user',
96
- 'content': 'Расскажи о себе подробно',
97
- },
98
- ]
99
- response = chat('qwen3:8b', messages=messages)
100
- ansver.append(f' start {t_start} ')
101
- response_time=datetime.now()-t_start
102
- ansver.append(f' duration {response_time} ')
103
- #
104
- response_len = len(response['message']['content'])
105
- ansver.append(f" lehgth {response_len}")
106
- response_speed=response_len/int(response_time.seconds)
107
- ansver.append(f" token/sek {response_len}")
108
- ansver.append(response['message']['content'])
109
- result = [f'<p>{answ}</p>' for answ in ansver ]
110
- return '\n'.join(result)
111
 
112
  #@app.route('/time14')
113
  def test_time14():
114
- from datetime import datetime
115
- from ollama import Client
116
- from ollama import chat
117
-
118
- t_start=datetime.now()
119
- ansver = []
120
- messages = [
121
- {
122
- 'role': 'user',
123
- 'content': 'Расскажи о себе подробно',
124
- },
125
- ]
126
- response = chat('qwen3:14b', messages=messages)
127
- ansver.append(f' start {t_start} ')
128
- response_time=datetime.now()-t_start
129
- ansver.append(f' duration {response_time} ')
130
- #
131
- response_len = len(response['message']['content'])
132
- ansver.append(f" lehgth {response_len}")
133
- response_speed=response_len/int(response_time.seconds)
134
- ansver.append(f" token/sek {response_len}")
135
- ansver.append(response['message']['content'])
136
- result = [f'<p>{answ}</p>' for answ in ansver ]
137
- return '\n'.join(result)
138
 
139
 
140
  #@app.route('/time30')
141
  def test_time30():
142
- from datetime import datetime
143
- from ollama import Client
144
- from ollama import chat
145
 
146
- t_start=datetime.now()
147
- ansver = []
148
- messages = [
149
- {
150
- 'role': 'user',
151
- 'content': 'Расскажи о себе подробно',
152
- },
153
- ]
154
- response = chat('qwen3:30b', messages=messages)
155
- ansver.append(f' start {t_start} ')
156
- response_time=datetime.now()-t_start
157
- ansver.append(f' duration {response_time} ')
158
- #
159
- response_len = len(response['message']['content'])
160
- ansver.append(f" lehgth {response_len}")
161
- response_speed=response_len/int(response_time.seconds)
162
- ansver.append(f" token/sek {response_len}")
163
- ansver.append(response['message']['content'])
164
- result = [f'<p>{answ}</p>' for answ in ansver ]
165
- return '\n'.join(result)
166
 
167
  if __name__ == '__main__':
168
  app.run(host='0.0.0.0', port="7860")
 
1
  from flask import Flask
2
  import ollama
3
+ from util import time_model
4
 
5
  app = Flask(__name__)
6
 
 
11
 
12
  @app.route('/list')
13
  def test_world():
14
+ from ollama import ListResponse, list as ollist
15
 
16
+ response: ListResponse = ollist()
17
  ansver = []
18
  for model in response.models:
19
  ansver.append(f'Name:{model.model}')
 
43
  ansver.append(f' Context length: {model.context_length}')
44
  ansver.append(f'\n')
45
 
46
+ response: ListResponse = ollist()
47
  for model in response.models:
48
  ansver.append(f'Name:{model.model}')
49
  ansver.append(f' Size (MB): {(model.size.real / 1024 / 1024):.2f}')
 
85
 
86
  @app.route('/time8')
87
  def test_time8():
88
+ return time_model('qwen3:8b')
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
89
 
90
  #@app.route('/time14')
91
  def test_time14():
92
+ return time_model('qwen3:14b')
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
93
 
94
 
95
  #@app.route('/time30')
96
  def test_time30():
97
+ return time_model('qwen3:30b')
 
 
98
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
 
100
  if __name__ == '__main__':
101
  app.run(host='0.0.0.0', port="7860")
start.sh CHANGED
@@ -6,6 +6,7 @@ while true
6
  done >/dev/null 2>&1 &
7
  echo sleep 3
8
  sleep 3
 
9
  /bin/bash pull14.sh
10
  echo list
11
  /usr/bin/ollama list
 
6
  done >/dev/null 2>&1 &
7
  echo sleep 3
8
  sleep 3
9
+ /bin/bash pull8.sh
10
  /bin/bash pull14.sh
11
  echo list
12
  /usr/bin/ollama list
util.py ADDED
@@ -0,0 +1,168 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from flask import Flask
2
+ import ollama
3
+
4
+ app = Flask(__name__)
5
+
6
@app.route('/')
def hello_world():
    """Serve the landing page: a single "Hello, World!" heading.

    Returns:
        str: the HTML fragment sent as the response body.
    """
    # The heading has to be terminated with </h1>; the previous version
    # emitted a second opening <h1>, leaving the element unclosed.
    return "<h1>Hello, World!</h1>"
9
+
10
+
11
@app.route('/list')
def test_world():
    """Render the models reported by ``ollama.list()`` as HTML paragraphs.

    For every model the name and size in MiB are emitted; when the model
    carries a ``details`` object its format, family, parameter size and
    quantization level are emitted as well.

    Returns:
        str: one ``<p>`` element per reported line, joined by newlines.
    """
    # Import under an alias so the builtin ``list`` is not shadowed inside
    # this view (same alias the main module uses).
    from ollama import ListResponse, list as ollist

    response: ListResponse = ollist()
    ansver = []
    for model in response.models:
        ansver.append(f'Name:{model.model}')
        ansver.append(f' Size (MB): {(model.size.real / 1024 / 1024):.2f}')
        if model.details:
            ansver.append(f' Format: {model.details.format}')
            ansver.append(f' Family: {model.details.family}')
            ansver.append(f' Parameter Size: {model.details.parameter_size}')
            ansver.append(f' Quantization Level:{model.details.quantization_level}')
    return '\n'.join(f'<p>{answ}</p>' for answ in ansver)
27
+
28
+
29
@app.route('/ps')
def ps():
    """Render the output of ``ollama.ps()`` followed by ``ollama.list()``.

    The first section lists, per model returned by ``ollama.ps()``, its
    name, digest, expiry, sizes, details and context length. The second
    section repeats the listing produced by the ``/list`` view.

    Returns:
        str: one ``<p>`` element per reported line, joined by newlines.
    """
    # Both helpers are imported under aliases:
    #  * ``ps`` would otherwise rebind this view's own name locally;
    #  * ``list`` was previously not imported here at all, so ``list()``
    #    resolved to the builtin and ``.models`` raised AttributeError.
    from ollama import ListResponse, ProcessResponse
    from ollama import list as ollist
    from ollama import ps as ollama_ps

    ansver = []

    running: ProcessResponse = ollama_ps()
    for model in running.models:
        ansver.append(f'Model: {model.model}')
        ansver.append(f' Digest: {model.digest}')
        ansver.append(f' Expires at: {model.expires_at}')
        ansver.append(f' Size: {model.size}')
        ansver.append(f' Size vram: {model.size_vram}')
        ansver.append(f' Details: {model.details}')
        ansver.append(f' Context length: {model.context_length}')
        ansver.append(f'\n')

    installed: ListResponse = ollist()
    for model in installed.models:
        ansver.append(f'Name:{model.model}')
        ansver.append(f' Size (MB): {(model.size.real / 1024 / 1024):.2f}')
        if model.details:
            ansver.append(f' Format: {model.details.format}')
            ansver.append(f' Family: {model.details.family}')
            ansver.append(f' Parameter Size: {model.details.parameter_size}')
            ansver.append(f' Quantization Level:{model.details.quantization_level}')
    return '\n'.join(f'<p>{answ}</p>' for answ in ansver)
56
+
57
def time_model(model_name):
    """Send one fixed prompt to *model_name* and report timing as HTML.

    This is the shared implementation behind the ``/time*`` views; the main
    module imports it as ``from util import time_model``.

    Args:
        model_name: Ollama model tag passed to ``ollama.chat``
            (for example ``'qwen3:8b'``).

    Returns:
        str: ``<p>`` elements with the start time, the elapsed duration, the
        reply length, the reply speed and finally the reply text itself,
        joined by newlines.
    """
    from datetime import datetime
    from ollama import chat

    t_start = datetime.now()
    messages = [
        {
            'role': 'user',
            'content': 'Расскажи о себе подробно',
        },
    ]
    response = chat(model_name, messages=messages)
    response_time = datetime.now() - t_start

    content = response['message']['content']
    # Length is measured in characters of the reply, so the speed below is
    # characters per second even though the label says "token/sek".
    response_len = len(content)

    # total_seconds() keeps the fractional part; the previous
    # int(timedelta.seconds) truncated to whole seconds and divided by zero
    # for replies that arrived in under a second.
    elapsed = response_time.total_seconds()
    response_speed = response_len / elapsed if elapsed > 0 else 0.0

    ansver = [
        f' start {t_start} ',
        f' duration {response_time} ',
        f" lehgth {response_len}",
        # Report the computed speed (previously the length was printed twice).
        f" token/sek {response_speed:.2f}",
        content,
    ]
    return '\n'.join(f'<p>{answ}</p>' for answ in ansver)


@app.route('/time')
def test_time():
    """Time the fixed prompt against ``qwen3:0.6b``."""
    return time_model('qwen3:0.6b')


@app.route('/time8')
def test_time8():
    """Time the fixed prompt against ``qwen3:8b``."""
    return time_model('qwen3:8b')


# Route registration is disabled in the original; the function is kept so it
# can be re-enabled by restoring the decorator.
#@app.route('/time14')
def test_time14():
    """Time the fixed prompt against ``qwen3:14b``."""
    return time_model('qwen3:14b')


# Route registration is disabled in the original (see test_time14).
#@app.route('/time30')
def test_time30():
    """Time the fixed prompt against ``qwen3:30b``."""
    return time_model('qwen3:30b')
166
+
167
if __name__ == '__main__':
    # Bind to every interface on port 7860. The port is given as an int,
    # which is the type Flask.run documents for this parameter (the original
    # passed the string "7860").
    app.run(host='0.0.0.0', port=7860)