#!/usr/bin/env python # -*- coding: utf-8 -*- """ Object pointing example using Rex Omni """ import matplotlib.pyplot as plt import torch from PIL import Image from rex_omni import RexOmniVisualize, RexOmniWrapper def main(): # Model path - replace with your actual model path model_path = "IDEA-Research/Rex-Omni" print("🚀 Initializing Rex Omni model...") # Create wrapper with custom parameters rex_model = RexOmniWrapper( model_path=model_path, backend="transformers", # Choose "transformers" or "vllm" max_tokens=2048, temperature=0.0, top_p=0.05, top_k=1, repetition_penalty=1.05, ) # Load image image_path = "tutorials/visual_prompting_example/test_images/pigeons.jpeg" # Replace with your image path image = Image.open(image_path).convert("RGB") print(f"✅ Image loaded successfully!") print(f"📏 Image size: {image.size}") visual_prompts = [ [644, 1210, 842, 1361], [1180, 1066, 1227, 1160], # Box 3: bottom region ] print("🎯 Performing object pointing...") results = rex_model.inference( images=image, task="visual_prompting", visual_prompt_boxes=visual_prompts, ) # Process results result = results[0] if result["success"]: predictions = result["extracted_predictions"] vis_image = RexOmniVisualize( image=image, predictions=predictions, font_size=30, draw_width=10, show_labels=True, ) # Save visualization output_path = ( "tutorials/visual_prompting_example/test_images/pigeons_visualize.jpg" ) vis_image.save(output_path) else: print(f"❌ Inference failed: {result['error']}") if __name__ == "__main__": main()