"""Quick start example: minimal code to run a Qwen ONNX model.

Loads the model found in the directory containing this script, feeds a fixed
prompt through the onnxruntime-genai token-by-token generation loop, and
prints the decoded result.
"""
from pathlib import Path

import onnxruntime_genai as og

# Point to your ONNX model directory (here: the folder this script lives in).
MODEL_DIR = Path(__file__).parent

# Load model and tokenizer.
print(f"Loading model from {MODEL_DIR}")
model = og.Model(str(MODEL_DIR))
tokenizer = og.Tokenizer(model)

# Simple text generation.
prompt = "Hello, how are you?"
print(f"\nPrompt: {prompt}")

# Encode input.
input_tokens = tokenizer.encode(prompt)

# Set up generation parameters. Search options are passed through
# GeneratorParams.set_search_options rather than assigned as attributes.
# NOTE(review): temperature presumably only matters when sampling is enabled
# (do_sample) -- confirm against the model's genai_config.json.
config = og.GeneratorParams(model)
config.set_search_options(max_length=100, temperature=0.6)

# Generate. The prompt is handed over with append_tokens; each call to
# generate_next_token then advances the sequence by one token, so no separate
# compute_logits step is issued (that call belongs to the pre-0.6 API and
# cannot be combined with append_tokens).
generator = og.Generator(model, config)
generator.append_tokens(input_tokens)
while not generator.is_done():
    generator.generate_next_token()

# Decode output.
# NOTE(review): get_sequence(0) is expected to return the whole sequence for
# the first batch entry, prompt tokens included -- verify if only the newly
# generated text should be shown.
output_tokens = generator.get_sequence(0)
output_text = tokenizer.decode(output_tokens)
print(f"Response: {output_text}")