khala / models /Megatron /tools /text_generation_cli.py
multimodalart's picture
multimodalart HF Staff
Initial best-effort ZeroGPU port of Khala song generation
d1f1097 verified
# Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.
import ast
import sys
import json
import requests
def parse_token_count(raw):
    """Parse the user's answer to the token-count prompt into an ``int``.

    The text is evaluated with ``ast.literal_eval`` (never ``eval``), so any
    Python integer literal is accepted (``"64"``, ``"0x40"``, ``"1_000"``).

    Args:
        raw: The line typed by the user.

    Returns:
        The parsed integer.

    Raises:
        ValueError: If ``raw`` is not a Python literal or the literal is not
            an integer (booleans are rejected as well).
    """
    try:
        # strip() keeps leading whitespace from being read as indentation.
        value = ast.literal_eval(raw.strip())
    except (ValueError, SyntaxError, TypeError, MemoryError, RecursionError) as err:
        raise ValueError(f"{raw!r} is not an integer") from err
    # bool is a subclass of int; "True" is not a sensible token count.
    if isinstance(value, bool) or not isinstance(value, int):
        raise ValueError(f"{raw!r} is not an integer")
    return value


def describe_error(response):
    """Return a printable description of a non-200 ``response``.

    Uses the ``message`` field of the JSON body when it is present; otherwise
    falls back to the raw body text so that non-JSON error pages (for example
    from a proxy in front of the server) are still reported instead of
    raising while building the error message.
    """
    try:
        return response.json()['message']
    except (ValueError, KeyError, TypeError):
        # ValueError: body is not JSON; KeyError/TypeError: no 'message' field.
        return response.text


def main(argv):
    """Run the interactive prompt loop against a text generation server.

    Repeatedly asks for a prompt and a number of tokens, sends them with an
    HTTP PUT to ``http://<argv[1]>/api`` as JSON
    (``{"prompts": [...], "tokens_to_generate": ...}``) and prints the first
    entry of the ``text`` field of the reply.

    Args:
        argv: Command-line arguments; ``argv[1]`` is the server address
            (without scheme), e.g. ``localhost:5000``.

    Returns:
        Process exit status: 0 when the user ends the session with
        Ctrl-D/Ctrl-C at a prompt, 1 when the server address is missing.
    """
    if len(argv) < 2:
        program = argv[0] if argv else 'text_generation_cli.py'
        print(f"Usage: {program} <host:port>", file=sys.stderr)
        return 1

    url = 'http://' + argv[1] + '/api'
    headers = {'Content-Type': 'application/json'}

    while True:
        try:
            sentence = input("Enter prompt: ")
            raw_count = input("Enter number of tokens to generate: ")
        except (EOFError, KeyboardInterrupt):
            # End of input or Ctrl-C at a prompt: leave without a traceback.
            print()
            return 0

        try:
            tokens_to_generate = parse_token_count(raw_count)
        except ValueError as err:
            # A typo should not end the session; ask again.
            print(f"Invalid number of tokens: {err}")
            continue

        data = {"prompts": [sentence], "tokens_to_generate": tokens_to_generate}
        try:
            response = requests.put(url, data=json.dumps(data), headers=headers)
        except requests.exceptions.RequestException as err:
            # Server unreachable / connection dropped: report and keep going.
            print(f"Request failed: {err}")
            continue

        if response.status_code != 200:
            print(f"Error {response.status_code}: {describe_error(response)}")
            continue

        print("Megatron Response: ")
        print(response.json()['text'][0])


if __name__ == "__main__":
    sys.exit(main(sys.argv))