shikibu9419 commited on
Commit
e0447d4
·
0 Parent(s):

Add PoC Code

Browse files
Files changed (3) hide show
  1. Pipfile +16 -0
  2. Pipfile.lock +253 -0
  3. app.py +83 -0
Pipfile ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [scripts]
2
+ dev = "uvicorn app:app --port=8000 --host=0.0.0.0"
3
+
4
+ [[source]]
5
+ url = "https://pypi.org/simple"
6
+ verify_ssl = true
7
+ name = "pypi"
8
+
9
+ [packages]
10
+ fastapi = "*"
11
+ groq = "*"
12
+ uvicorn = "*"
13
+ async-timeout = "*"
14
+ sse-starlette = "*"
15
+
16
+ [dev-packages]
Pipfile.lock ADDED
@@ -0,0 +1,253 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_meta": {
3
+ "hash": {
4
+ "sha256": "05315b6be9cdd53948108843fd27d78fd0eddd908f19395b9a5022bd2fa2f481"
5
+ },
6
+ "pipfile-spec": 6,
7
+ "requires": {},
8
+ "sources": [
9
+ {
10
+ "name": "pypi",
11
+ "url": "https://pypi.org/simple",
12
+ "verify_ssl": true
13
+ }
14
+ ]
15
+ },
16
+ "default": {
17
+ "annotated-types": {
18
+ "hashes": [
19
+ "sha256:0641064de18ba7a25dee8f96403ebc39113d0cb953a01429249d5c7564666a43",
20
+ "sha256:563339e807e53ffd9c267e99fc6d9ea23eb8443c08f112651963e24e22f84a5d"
21
+ ],
22
+ "markers": "python_version >= '3.8'",
23
+ "version": "==0.6.0"
24
+ },
25
+ "anyio": {
26
+ "hashes": [
27
+ "sha256:048e05d0f6caeed70d731f3db756d35dcc1f35747c8c403364a8332c630441b8",
28
+ "sha256:f75253795a87df48568485fd18cdd2a3fa5c4f7c5be8e5e36637733fce06fed6"
29
+ ],
30
+ "markers": "python_version >= '3.8'",
31
+ "version": "==4.3.0"
32
+ },
33
+ "async-timeout": {
34
+ "hashes": [
35
+ "sha256:4640d96be84d82d02ed59ea2b7105a0f7b33abe8703703cd0ab0bf87c427522f",
36
+ "sha256:7405140ff1230c310e51dc27b3145b9092d659ce68ff733fb0cefe3ee42be028"
37
+ ],
38
+ "index": "pypi",
39
+ "markers": "python_version >= '3.7'",
40
+ "version": "==4.0.3"
41
+ },
42
+ "certifi": {
43
+ "hashes": [
44
+ "sha256:0569859f95fc761b18b45ef421b1290a0f65f147e92a1e5eb3e635f9a5e4e66f",
45
+ "sha256:dc383c07b76109f368f6106eee2b593b04a011ea4d55f652c6ca24a754d1cdd1"
46
+ ],
47
+ "markers": "python_version >= '3.6'",
48
+ "version": "==2024.2.2"
49
+ },
50
+ "click": {
51
+ "hashes": [
52
+ "sha256:ae74fb96c20a0277a1d615f1e4d73c8414f5a98db8b799a7931d1582f3390c28",
53
+ "sha256:ca9853ad459e787e2192211578cc907e7594e294c7ccc834310722b41b9ca6de"
54
+ ],
55
+ "markers": "python_version >= '3.7'",
56
+ "version": "==8.1.7"
57
+ },
58
+ "distro": {
59
+ "hashes": [
60
+ "sha256:2fa77c6fd8940f116ee1d6b94a2f90b13b5ea8d019b98bc8bafdcabcdd9bdbed",
61
+ "sha256:7bffd925d65168f85027d8da9af6bddab658135b840670a223589bc0c8ef02b2"
62
+ ],
63
+ "markers": "python_version >= '3.6'",
64
+ "version": "==1.9.0"
65
+ },
66
+ "fastapi": {
67
+ "hashes": [
68
+ "sha256:266775f0dcc95af9d3ef39bad55cff525329a931d5fd51930aadd4f428bf7ff3",
69
+ "sha256:87a1f6fb632a218222c5984be540055346a8f5d8a68e8f6fb647b1dc9934de4b"
70
+ ],
71
+ "index": "pypi",
72
+ "markers": "python_version >= '3.8'",
73
+ "version": "==0.110.0"
74
+ },
75
+ "groq": {
76
+ "hashes": [
77
+ "sha256:2939ff96e3fc633416e5d9ab26bbfd63c70b2226338a507f8c2b0b3aa27c9dec",
78
+ "sha256:f2285c0a7d64abefcdec3d61e8bc1a61ff04d887ed30b991ac7fe53ae1e10251"
79
+ ],
80
+ "index": "pypi",
81
+ "markers": "python_version >= '3.7'",
82
+ "version": "==0.4.1"
83
+ },
84
+ "h11": {
85
+ "hashes": [
86
+ "sha256:8f19fbbe99e72420ff35c00b27a34cb9937e902a8b810e2c88300c6f0a3b699d",
87
+ "sha256:e3fe4ac4b851c468cc8363d500db52c2ead036020723024a109d37346efaa761"
88
+ ],
89
+ "markers": "python_version >= '3.7'",
90
+ "version": "==0.14.0"
91
+ },
92
+ "httpcore": {
93
+ "hashes": [
94
+ "sha256:ac418c1db41bade2ad53ae2f3834a3a0f5ae76b56cf5aa497d2d033384fc7d73",
95
+ "sha256:cb2839ccfcba0d2d3c1131d3c3e26dfc327326fbe7a5dc0dbfe9f6c9151bb022"
96
+ ],
97
+ "markers": "python_version >= '3.8'",
98
+ "version": "==1.0.4"
99
+ },
100
+ "httpx": {
101
+ "hashes": [
102
+ "sha256:71d5465162c13681bff01ad59b2cc68dd838ea1f10e51574bac27103f00c91a5",
103
+ "sha256:a0cb88a46f32dc874e04ee956e4c2764aba2aa228f650b06788ba6bda2962ab5"
104
+ ],
105
+ "markers": "python_version >= '3.8'",
106
+ "version": "==0.27.0"
107
+ },
108
+ "idna": {
109
+ "hashes": [
110
+ "sha256:9ecdbbd083b06798ae1e86adcbfe8ab1479cf864e4ee30fe4e46a003d12491ca",
111
+ "sha256:c05567e9c24a6b9faaa835c4821bad0590fbb9d5779e7caa6e1cc4978e7eb24f"
112
+ ],
113
+ "markers": "python_version >= '3.5'",
114
+ "version": "==3.6"
115
+ },
116
+ "pydantic": {
117
+ "hashes": [
118
+ "sha256:37a5432e54b12fecaa1049c5195f3d860a10e01bdfd24f1840ef14bd0d3aeab3",
119
+ "sha256:a09be1c3d28f3abe37f8a78af58284b236a92ce520105ddc91a6d29ea1176ba7"
120
+ ],
121
+ "markers": "python_version >= '3.8'",
122
+ "version": "==2.6.2"
123
+ },
124
+ "pydantic-core": {
125
+ "hashes": [
126
+ "sha256:00ee1c97b5364b84cb0bd82e9bbf645d5e2871fb8c58059d158412fee2d33d8a",
127
+ "sha256:0d32576b1de5a30d9a97f300cc6a3f4694c428d956adbc7e6e2f9cad279e45ed",
128
+ "sha256:0df446663464884297c793874573549229f9eca73b59360878f382a0fc085979",
129
+ "sha256:0f56ae86b60ea987ae8bcd6654a887238fd53d1384f9b222ac457070b7ac4cff",
130
+ "sha256:13dcc4802961b5f843a9385fc821a0b0135e8c07fc3d9949fd49627c1a5e6ae5",
131
+ "sha256:162e498303d2b1c036b957a1278fa0899d02b2842f1ff901b6395104c5554a45",
132
+ "sha256:1b662180108c55dfbf1280d865b2d116633d436cfc0bba82323554873967b340",
133
+ "sha256:1cac689f80a3abab2d3c0048b29eea5751114054f032a941a32de4c852c59cad",
134
+ "sha256:21b888c973e4f26b7a96491c0965a8a312e13be108022ee510248fe379a5fa23",
135
+ "sha256:287073c66748f624be4cef893ef9174e3eb88fe0b8a78dc22e88eca4bc357ca6",
136
+ "sha256:2a1ef6a36fdbf71538142ed604ad19b82f67b05749512e47f247a6ddd06afdc7",
137
+ "sha256:2a72fb9963cba4cd5793854fd12f4cfee731e86df140f59ff52a49b3552db241",
138
+ "sha256:2acca2be4bb2f2147ada8cac612f8a98fc09f41c89f87add7256ad27332c2fda",
139
+ "sha256:2f583bd01bbfbff4eaee0868e6fc607efdfcc2b03c1c766b06a707abbc856187",
140
+ "sha256:33809aebac276089b78db106ee692bdc9044710e26f24a9a2eaa35a0f9fa70ba",
141
+ "sha256:36fa178aacbc277bc6b62a2c3da95226520da4f4e9e206fdf076484363895d2c",
142
+ "sha256:4204e773b4b408062960e65468d5346bdfe139247ee5f1ca2a378983e11388a2",
143
+ "sha256:4384a8f68ddb31a0b0c3deae88765f5868a1b9148939c3f4121233314ad5532c",
144
+ "sha256:456855f57b413f077dff513a5a28ed838dbbb15082ba00f80750377eed23d132",
145
+ "sha256:49d5d58abd4b83fb8ce763be7794d09b2f50f10aa65c0f0c1696c677edeb7cbf",
146
+ "sha256:4ac6b4ce1e7283d715c4b729d8f9dab9627586dafce81d9eaa009dd7f25dd972",
147
+ "sha256:4df8a199d9f6afc5ae9a65f8f95ee52cae389a8c6b20163762bde0426275b7db",
148
+ "sha256:500960cb3a0543a724a81ba859da816e8cf01b0e6aaeedf2c3775d12ee49cade",
149
+ "sha256:519ae0312616026bf4cedc0fe459e982734f3ca82ee8c7246c19b650b60a5ee4",
150
+ "sha256:578114bc803a4c1ff9946d977c221e4376620a46cf78da267d946397dc9514a8",
151
+ "sha256:5c5cbc703168d1b7a838668998308018a2718c2130595e8e190220238addc96f",
152
+ "sha256:6162f8d2dc27ba21027f261e4fa26f8bcb3cf9784b7f9499466a311ac284b5b9",
153
+ "sha256:704d35ecc7e9c31d48926150afada60401c55efa3b46cd1ded5a01bdffaf1d48",
154
+ "sha256:716b542728d4c742353448765aa7cdaa519a7b82f9564130e2b3f6766018c9ec",
155
+ "sha256:72282ad4892a9fb2da25defeac8c2e84352c108705c972db82ab121d15f14e6d",
156
+ "sha256:7233d65d9d651242a68801159763d09e9ec96e8a158dbf118dc090cd77a104c9",
157
+ "sha256:732da3243e1b8d3eab8c6ae23ae6a58548849d2e4a4e03a1924c8ddf71a387cb",
158
+ "sha256:75b81e678d1c1ede0785c7f46690621e4c6e63ccd9192af1f0bd9d504bbb6bf4",
159
+ "sha256:75f76ee558751746d6a38f89d60b6228fa174e5172d143886af0f85aa306fd89",
160
+ "sha256:7ee8d5f878dccb6d499ba4d30d757111847b6849ae07acdd1205fffa1fc1253c",
161
+ "sha256:7f752826b5b8361193df55afcdf8ca6a57d0232653494ba473630a83ba50d8c9",
162
+ "sha256:86b3d0033580bd6bbe07590152007275bd7af95f98eaa5bd36f3da219dcd93da",
163
+ "sha256:8d62da299c6ecb04df729e4b5c52dc0d53f4f8430b4492b93aa8de1f541c4aac",
164
+ "sha256:8e47755d8152c1ab5b55928ab422a76e2e7b22b5ed8e90a7d584268dd49e9c6b",
165
+ "sha256:9091632a25b8b87b9a605ec0e61f241c456e9248bfdcf7abdf344fdb169c81cf",
166
+ "sha256:936e5db01dd49476fa8f4383c259b8b1303d5dd5fb34c97de194560698cc2c5e",
167
+ "sha256:99b6add4c0b39a513d323d3b93bc173dac663c27b99860dd5bf491b240d26137",
168
+ "sha256:9c865a7ee6f93783bd5d781af5a4c43dadc37053a5b42f7d18dc019f8c9d2bd1",
169
+ "sha256:a425479ee40ff021f8216c9d07a6a3b54b31c8267c6e17aa88b70d7ebd0e5e5b",
170
+ "sha256:a4b2bf78342c40b3dc830880106f54328928ff03e357935ad26c7128bbd66ce8",
171
+ "sha256:a6b1bb0827f56654b4437955555dc3aeeebeddc47c2d7ed575477f082622c49e",
172
+ "sha256:aaf09e615a0bf98d406657e0008e4a8701b11481840be7d31755dc9f97c44053",
173
+ "sha256:b1f6f5938d63c6139860f044e2538baeee6f0b251a1816e7adb6cbce106a1f01",
174
+ "sha256:b29eeb887aa931c2fcef5aa515d9d176d25006794610c264ddc114c053bf96fe",
175
+ "sha256:b3992a322a5617ded0a9f23fd06dbc1e4bd7cf39bc4ccf344b10f80af58beacd",
176
+ "sha256:b5b6079cc452a7c53dd378c6f881ac528246b3ac9aae0f8eef98498a75657805",
177
+ "sha256:b60cc1a081f80a2105a59385b92d82278b15d80ebb3adb200542ae165cd7d183",
178
+ "sha256:b926dd38db1519ed3043a4de50214e0d600d404099c3392f098a7f9d75029ff8",
179
+ "sha256:bd87f48924f360e5d1c5f770d6155ce0e7d83f7b4e10c2f9ec001c73cf475c99",
180
+ "sha256:bda1ee3e08252b8d41fa5537413ffdddd58fa73107171a126d3b9ff001b9b820",
181
+ "sha256:be0ec334369316fa73448cc8c982c01e5d2a81c95969d58b8f6e272884df0074",
182
+ "sha256:c6119dc90483a5cb50a1306adb8d52c66e447da88ea44f323e0ae1a5fcb14256",
183
+ "sha256:c9803edf8e29bd825f43481f19c37f50d2b01899448273b3a7758441b512acf8",
184
+ "sha256:c9bd22a2a639e26171068f8ebb5400ce2c1bc7d17959f60a3b753ae13c632975",
185
+ "sha256:cbcc558401de90a746d02ef330c528f2e668c83350f045833543cd57ecead1ad",
186
+ "sha256:cf6204fe865da605285c34cf1172879d0314ff267b1c35ff59de7154f35fdc2e",
187
+ "sha256:d33dd21f572545649f90c38c227cc8631268ba25c460b5569abebdd0ec5974ca",
188
+ "sha256:d89ca19cdd0dd5f31606a9329e309d4fcbb3df860960acec32630297d61820df",
189
+ "sha256:d8f99b147ff3fcf6b3cc60cb0c39ea443884d5559a30b1481e92495f2310ff2b",
190
+ "sha256:d937653a696465677ed583124b94a4b2d79f5e30b2c46115a68e482c6a591c8a",
191
+ "sha256:dcca5d2bf65c6fb591fff92da03f94cd4f315972f97c21975398bd4bd046854a",
192
+ "sha256:ded1c35f15c9dea16ead9bffcde9bb5c7c031bff076355dc58dcb1cb436c4721",
193
+ "sha256:e3e70c94a0c3841e6aa831edab1619ad5c511199be94d0c11ba75fe06efe107a",
194
+ "sha256:e56f8186d6210ac7ece503193ec84104da7ceb98f68ce18c07282fcc2452e76f",
195
+ "sha256:e7774b570e61cb998490c5235740d475413a1f6de823169b4cf94e2fe9e9f6b2",
196
+ "sha256:e7c6ed0dc9d8e65f24f5824291550139fe6f37fac03788d4580da0d33bc00c97",
197
+ "sha256:ec08be75bb268473677edb83ba71e7e74b43c008e4a7b1907c6d57e940bf34b6",
198
+ "sha256:ecdf6bf5f578615f2e985a5e1f6572e23aa632c4bd1dc67f8f406d445ac115ed",
199
+ "sha256:ed25e1835c00a332cb10c683cd39da96a719ab1dfc08427d476bce41b92531fc",
200
+ "sha256:f4cb85f693044e0f71f394ff76c98ddc1bc0953e48c061725e540396d5c8a2e1",
201
+ "sha256:f53aace168a2a10582e570b7736cc5bef12cae9cf21775e3eafac597e8551fbe",
202
+ "sha256:f651dd19363c632f4abe3480a7c87a9773be27cfe1341aef06e8759599454120",
203
+ "sha256:fc4ad7f7ee1a13d9cb49d8198cd7d7e3aa93e425f371a68235f784e99741561f",
204
+ "sha256:fee427241c2d9fb7192b658190f9f5fd6dfe41e02f3c1489d2ec1e6a5ab1e04a"
205
+ ],
206
+ "markers": "python_version >= '3.8'",
207
+ "version": "==2.16.3"
208
+ },
209
+ "sniffio": {
210
+ "hashes": [
211
+ "sha256:2f6da418d1f1e0fddd844478f41680e794e6051915791a034ff65e5f100525a2",
212
+ "sha256:f4324edc670a0f49750a81b895f35c3adb843cca46f0530f79fc1babb23789dc"
213
+ ],
214
+ "markers": "python_version >= '3.7'",
215
+ "version": "==1.3.1"
216
+ },
217
+ "sse-starlette": {
218
+ "hashes": [
219
+ "sha256:0c43cc43aca4884c88c8416b65777c4de874cc4773e6458d3579c0a353dc2fb7",
220
+ "sha256:c4dd134302cb9708d47cae23c365fe0a089aa2a875d2f887ac80f235a9ee5744"
221
+ ],
222
+ "index": "pypi",
223
+ "markers": "python_version >= '3.8'",
224
+ "version": "==2.0.0"
225
+ },
226
+ "starlette": {
227
+ "hashes": [
228
+ "sha256:13d429aa93a61dc40bf503e8c801db1f1bca3dc706b10ef2434a36123568f044",
229
+ "sha256:90a671733cfb35771d8cc605e0b679d23b992f8dcfad48cc60b38cb29aeb7080"
230
+ ],
231
+ "markers": "python_version >= '3.8'",
232
+ "version": "==0.36.3"
233
+ },
234
+ "typing-extensions": {
235
+ "hashes": [
236
+ "sha256:69b1a937c3a517342112fb4c6df7e72fc39a38e7891a5730ed4985b5214b5475",
237
+ "sha256:b0abd7c89e8fb96f98db18d86106ff1d90ab692004eb746cf6eda2682f91b3cb"
238
+ ],
239
+ "markers": "python_version >= '3.8'",
240
+ "version": "==4.10.0"
241
+ },
242
+ "uvicorn": {
243
+ "hashes": [
244
+ "sha256:3d9a267296243532db80c83a959a3400502165ade2c1338dea4e67915fd4745a",
245
+ "sha256:5c89da2f3895767472a35556e539fd59f7edbe9b1e9c0e1c99eebeadc61838e4"
246
+ ],
247
+ "index": "pypi",
248
+ "markers": "python_version >= '3.8'",
249
+ "version": "==0.27.1"
250
+ }
251
+ },
252
+ "develop": {}
253
+ }
app.py ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI, HTTPException, Header
2
+ from pydantic import BaseModel
3
+ from typing import List
4
+
5
+ from starlette.middleware.cors import CORSMiddleware
6
+ from sse_starlette.sse import EventSourceResponse
7
+
8
+ from groq import AsyncGroq, Groq
9
+ from groq.resources import Models
10
+ from groq.types import ModelList
11
+ from groq.types.chat.completion_create_params import Message
12
+
13
+ from json import dumps
14
+ import async_timeout
15
+ import asyncio
16
+
17
+ GENERATION_TIMEOUT_SEC = 60
18
+
19
+ app = FastAPI()
20
+ app.add_middleware(
21
+ CORSMiddleware,
22
+ allow_origins=["*"],
23
+ allow_credentials=True,
24
+ allow_methods=["*"],
25
+ allow_headers=["*"]
26
+ )
27
+
28
+
29
+ class ChatInput(BaseModel):
30
+ model: str
31
+ messages: List[Message]
32
+ stream: bool
33
+ temperature: float = 0
34
+ max_tokens: int = 100
35
+ user: str = "user"
36
+
37
+
38
+ async def get_groq_response(client: AsyncGroq, req: ChatInput):
39
+ async with async_timeout.timeout(GENERATION_TIMEOUT_SEC):
40
+ try:
41
+ stream = await client.chat.completions.create(
42
+ messages=req.messages,
43
+ model=req.model,
44
+ temperature=req.temperature,
45
+ max_tokens=req.max_tokens,
46
+ stream=req.stream,
47
+ )
48
+
49
+ async for chunk in stream:
50
+ yield {"data": dumps(chunk.dict())}
51
+
52
+ except asyncio.TimeoutError:
53
+ raise HTTPException(status_code=504, detail="Stream timed out")
54
+
55
+
56
+ @app.get("/models")
57
+ async def models(authorization: str = Header()) -> ModelList:
58
+ client = Groq(
59
+ api_key=authorization.split(" ")[-1],
60
+ )
61
+ models = Models(client=client).list()
62
+
63
+ return models
64
+
65
+
66
+ @app.post("/chat/completions")
67
+ async def completion(req: ChatInput, authorization: str = Header()):
68
+ client = AsyncGroq(
69
+ api_key=authorization.split(" ")[-1],
70
+ )
71
+
72
+ if req.stream:
73
+ return EventSourceResponse(get_groq_response(client, req))
74
+
75
+ response = await client.chat.completions.create(
76
+ messages=req.messages,
77
+ model=req.model,
78
+ temperature=req.temperature,
79
+ max_tokens=req.max_tokens,
80
+ stream=req.stream,
81
+ )
82
+
83
+ return response