"""Smoke-test script: send one non-streaming request to ``chat_completions``."""

import asyncio
import os

# Must stay above the ``app`` import: the assignment runs first so the value
# is already in the environment when ``app`` is loaded.
# NOTE(review): presumably ``app`` reads this variable at import time — confirm.
os.environ['MODELSCOPE_ENVIRONMENT'] = ''

from app import chat_completions, ChatCompletionRequest  # noqa: E402


async def run_once() -> None:
    """Build a single chat-completion request, await it, and print the result.

    The request is non-streaming (``stream=False``) and asks for usage
    information (``include_usage=True``). Whatever ``chat_completions``
    returns is printed as-is.
    """
    req = ChatCompletionRequest(
        model='rwkv-latest',
        prompt='Who is the president of France today?',
        stream=False,
        max_tokens=32,
        temperature=0.2,
        include_usage=True,
    )
    res = await chat_completions(req)
    print(res)


if __name__ == '__main__':
    asyncio.run(run_once())