# File size: 614 Bytes (revision d2426db)
import requests
import json
# Send a single chat-completion request to a locally hosted server and print
# the decoded JSON reply. The URL path follows the OpenAI-style
# "/v1/chat/completions" convention.
url = "http://localhost:1234/v1/chat/completions"
headers = {
    "Content-Type": "application/json",
}

# (connect, read) timeouts in seconds. Without a timeout, requests waits
# forever if the server is unreachable or stalls mid-generation. The read
# timeout is generous because local generation can be slow.
REQUEST_TIMEOUT = (5, 120)

payload = {
    "model": "gemma-3-4b-it-qat-int4",
    "messages": [
        {
            "role": "system",
            "content": "help me in ml",
        },
        {
            "role": "user",
            "content": "hello",
        },
    ],
    # This key was previously misspelled "temprature", so the intended value
    # was never sent under the name the chat-completions API expects.
    "temperature": 0.7,
    "max_tokens": 256,
    "top_p": 0.9,
    "top_k": 40,
    "presence_penalty": 0.0,
    "frequency_penalty": 0.0,
    # NOTE(review): a newline stop sequence asks the server to end the reply
    # at the first line break, so answers are limited to one line. Confirm
    # that this is intended.
    "stop": ["\n"],
}

# The body is serialized explicitly to match the Content-Type header above.
response = requests.post(
    url,
    headers=headers,
    data=json.dumps(payload),
    timeout=REQUEST_TIMEOUT,
)
print(response.json())