TruVlad committed on
Commit
1335bf8
·
verified ·
1 Parent(s): 486a947

Upload folder using huggingface_hub

Browse files
Files changed (6) hide show
  1. Dockerfile +6 -2
  2. main.py +30 -3
  3. pull06.sh +16 -0
  4. pull14.sh +16 -0
  5. pull8.sh +16 -0
  6. start.sh +5 -4
Dockerfile CHANGED
@@ -25,8 +25,12 @@ ENV OLLAMA_LOAD_TIMEOUT="24h"
25
  RUN apt-get update && apt-get upgrade -y
26
  RUN apt-get install git g++ python3 python3-pip -y && apt-get clean
27
 
28
- COPY pull.sh pull.sh
29
- RUN /bin/bash -x pull.sh
 
 
 
 
30
 
31
  COPY requirements.txt requirements.txt
32
  RUN pip install --no-cache-dir -r requirements.txt --break-system-packages
 
25
  RUN apt-get update && apt-get upgrade -y
26
  RUN apt-get install git g++ python3 python3-pip -y && apt-get clean
27
 
28
+ COPY pull06.sh pull06.sh
29
+ RUN /bin/bash -x pull06.sh
30
+ COPY pull8.sh pull8.sh
31
+ RUN /bin/bash -x pull8.sh
32
+ # COPY pull14.sh pull14.sh
33
+ # RUN /bin/bash -x pull14.sh
34
 
35
  COPY requirements.txt requirements.txt
36
  RUN pip install --no-cache-dir -r requirements.txt --break-system-packages
main.py CHANGED
@@ -82,7 +82,34 @@ def test_time():
82
  return '\n'.join(result)
83
 
84
 
85
- @app.route('/time14')
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
86
  def test_time14():
87
  from datetime import datetime
88
  from ollama import Client
@@ -96,7 +123,7 @@ def test_time14():
96
  'content': 'Расскажи о себе подробно',
97
  },
98
  ]
99
- response = chat('qwen3:30b', messages=messages)
100
  ansver.append(f' start {t_start} ')
101
  response_time=datetime.now()-t_start
102
  ansver.append(f' duration {response_time} ')
@@ -110,7 +137,7 @@ def test_time14():
110
  return '\n'.join(result)
111
 
112
 
113
- @app.route('/time30')
114
  def test_time30():
115
  from datetime import datetime
116
  from ollama import Client
 
82
  return '\n'.join(result)
83
 
84
 
85
@app.route('/time8')
def test_time8():
    """Time one chat completion against the ``qwen3:8b`` model.

    Sends a single fixed user prompt through ``ollama.chat`` and reports how
    long the call took.

    Returns:
        str: newline-joined ``<p>`` elements holding, in order, the start
        timestamp, the elapsed time, the reply length in characters, the
        reply length divided by the elapsed seconds, and the reply text.
    """
    from datetime import datetime
    from ollama import chat

    t_start = datetime.now()
    messages = [
        {
            'role': 'user',
            'content': 'Расскажи о себе подробно',
        },
    ]
    response = chat('qwen3:8b', messages=messages)
    response_time = datetime.now() - t_start

    content = response['message']['content']
    response_len = len(content)

    # total_seconds() keeps the fractional part and any whole days, whereas
    # int(timedelta.seconds) is 0 for a sub-second reply and made the
    # division raise ZeroDivisionError.
    elapsed = response_time.total_seconds()
    response_speed = response_len / elapsed if elapsed > 0 else 0.0

    report = [
        f' start {t_start} ',
        f' duration {response_time} ',
        f" lehgth {response_len}",
        # Report the computed rate (previously the length was printed again).
        # The value is characters per second: response_len counts characters
        # of the reply, not model tokens.
        f" token/sek {response_speed:.2f}",
        # NOTE(review): the reply text is placed into the HTML unescaped.
        content,
    ]
    return '\n'.join(f'<p>{line}</p>' for line in report)
111
+
112
+ #@app.route('/time14')
113
  def test_time14():
114
  from datetime import datetime
115
  from ollama import Client
 
123
  'content': 'Расскажи о себе подробно',
124
  },
125
  ]
126
+ response = chat('qwen3:14b', messages=messages)
127
  ansver.append(f' start {t_start} ')
128
  response_time=datetime.now()-t_start
129
  ansver.append(f' duration {response_time} ')
 
137
  return '\n'.join(result)
138
 
139
 
140
+ #@app.route('/time30')
141
  def test_time30():
142
  from datetime import datetime
143
  from ollama import Client
pull06.sh ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/bin/bash
# Start an Ollama server in the background, then pull the models that are
# not commented out below and print the list of installed models.

# Supervisor loop: whenever `ollama serve` exits, wait 9 seconds and start
# it again. The loop runs in the background and all of its output
# (including the echo) is discarded.
while true
do nohup ollama serve >/dev/null 2>&1
echo sleep 9
sleep 9
done >/dev/null 2>&1 &

# Fixed delay before the first pull so the server has time to come up.
echo sleep 5
sleep 5

# Model selection: uncomment a line to include that model.
# /usr/bin/ollama pull qwen3-next:80b
# /usr/bin/ollama pull qwen3-vl:235b
/usr/bin/ollama pull qwen3:0.6b
/usr/bin/ollama pull qwen3:8b
# /usr/bin/ollama pull qwen3:14b
# /usr/bin/ollama pull qwen3:30b
# /usr/bin/ollama pull qwen3.5:35b

# Show what is installed after the pulls.
/usr/bin/ollama list
pull14.sh ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/bin/bash
# Start an Ollama server in the background, then pull the models that are
# not commented out below (currently qwen3:14b) and print the list of
# installed models.

# Supervisor loop: whenever `ollama serve` exits, wait 9 seconds and start
# it again. The loop runs in the background and all of its output
# (including the echo) is discarded.
while true
do nohup ollama serve >/dev/null 2>&1
echo sleep 9
sleep 9
done >/dev/null 2>&1 &

# Fixed delay before the first pull so the server has time to come up.
echo sleep 5
sleep 5

# Model selection: uncomment a line to include that model.
# /usr/bin/ollama pull qwen3-next:80b
# /usr/bin/ollama pull qwen3-vl:235b
# /usr/bin/ollama pull qwen3:0.6b
# /usr/bin/ollama pull qwen3:8b
/usr/bin/ollama pull qwen3:14b
# /usr/bin/ollama pull qwen3:30b
# /usr/bin/ollama pull qwen3.5:35b

# Show what is installed after the pulls.
/usr/bin/ollama list
pull8.sh ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/bin/bash
# Start an Ollama server in the background, then pull the models that are
# not commented out below and print the list of installed models.
#
# NOTE(review): despite the file name, only qwen3:0.6b is enabled here and
# the qwen3:8b line is commented out - confirm this is intended.

# Supervisor loop: whenever `ollama serve` exits, wait 9 seconds and start
# it again. The loop runs in the background and all of its output
# (including the echo) is discarded.
while true
do nohup ollama serve >/dev/null 2>&1
echo sleep 9
sleep 9
done >/dev/null 2>&1 &

# Fixed delay before the first pull so the server has time to come up.
echo sleep 5
sleep 5

# Model selection: uncomment a line to include that model.
# /usr/bin/ollama pull qwen3-next:80b
# /usr/bin/ollama pull qwen3-vl:235b
/usr/bin/ollama pull qwen3:0.6b
# /usr/bin/ollama pull qwen3:8b
# /usr/bin/ollama pull qwen3:14b
# /usr/bin/ollama pull qwen3:30b
# /usr/bin/ollama pull qwen3.5:35b

# Show what is installed after the pulls.
/usr/bin/ollama list
start.sh CHANGED
@@ -1,11 +1,12 @@
1
  #/bin/bash
2
  while true
3
  do nohup ollama serve >/dev/null 2>&1
4
- echo sleep 9
5
- sleep 9
6
  done >/dev/null 2>&1 &
7
- echo sleep 30
8
- sleep 30
 
9
  echo list
10
  /usr/bin/ollama list
11
  python3 main.py
 
#!/bin/bash
# Container entry script: keep an Ollama server running in the background,
# pull the qwen3:14b model via pull14.sh, list the installed models, and
# then run the Python application in the foreground.

# Supervisor loop: whenever `ollama serve` exits, wait 4 seconds and start
# it again. The loop runs in the background and all of its output
# (including the echo) is discarded.
while true
do nohup ollama serve >/dev/null 2>&1
echo sleep 4
sleep 4
done >/dev/null 2>&1 &

# Fixed delay so the server has time to come up.
echo sleep 3
sleep 3

# NOTE(review): pull14.sh launches its own background `ollama serve` loop in
# addition to the one started above - confirm the duplicate is intended.
/bin/bash pull14.sh

echo list
/usr/bin/ollama list
python3 main.py