Spaces:
Running
on
Zero
Running
on
Zero
| #!/usr/bin/env python | |
| # -*- coding: utf-8 -*- | |
| """ | |
| Object pointing example using Rex Omni | |
| """ | |
| import matplotlib.pyplot as plt | |
| import torch | |
| from PIL import Image | |
| from rex_omni import RexOmniVisualize, RexOmniWrapper | |
| def main(): | |
| # Model path - replace with your actual model path | |
| model_path = "IDEA-Research/Rex-Omni" | |
| print("π Initializing Rex Omni model...") | |
| # Create wrapper with custom parameters | |
| rex_model = RexOmniWrapper( | |
| model_path=model_path, | |
| backend="transformers", # Choose "transformers" or "vllm" | |
| max_tokens=2048, | |
| temperature=0.0, | |
| top_p=0.05, | |
| top_k=1, | |
| repetition_penalty=1.05, | |
| ) | |
| # Load image | |
| image_path = "tutorials/visual_prompting_example/test_images/pigeons.jpeg" # Replace with your image path | |
| image = Image.open(image_path).convert("RGB") | |
| print(f"β Image loaded successfully!") | |
| print(f"π Image size: {image.size}") | |
| visual_prompts = [ | |
| [644, 1210, 842, 1361], | |
| [1180, 1066, 1227, 1160], # Box 3: bottom region | |
| ] | |
| print("π― Performing object pointing...") | |
| results = rex_model.inference( | |
| images=image, | |
| task="visual_prompting", | |
| visual_prompt_boxes=visual_prompts, | |
| ) | |
| # Process results | |
| result = results[0] | |
| if result["success"]: | |
| predictions = result["extracted_predictions"] | |
| vis_image = RexOmniVisualize( | |
| image=image, | |
| predictions=predictions, | |
| font_size=30, | |
| draw_width=10, | |
| show_labels=True, | |
| ) | |
| # Save visualization | |
| output_path = ( | |
| "tutorials/visual_prompting_example/test_images/pigeons_visualize.jpg" | |
| ) | |
| vis_image.save(output_path) | |
| else: | |
| print(f"β Inference failed: {result['error']}") | |
| if __name__ == "__main__": | |
| main() | |