Upload model files

Files changed (7) hide show

README.md CHANGED Viewed

@@ -28,6 +28,35 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 import torch
 # load model
-model = AutoModelForCausalLM.from_pretrained("Ricky06662/Seg-Zero-7B")
-tokenizer = AutoTokenizer.from_pretrained("Ricky06662/Seg-Zero-7B")
 ```

 import torch
 # load model
+model = Qwen2_5_VLForConditionalGeneration.from_pretrained("Ricky06662/Seg-Zero-7B")
+tokenizer = AutoTokenizer.from_pretrained("Ricky06662/Seg-Zero-7B")
+```
+## Installation
+```bash
+git clone https://github.com/dvlab-research/Seg-Zero.git
+cd Seg-Zero
+conda create -n seg_zero python=3.11
+conda activate seg_zero
+pip install torch==2.5.1 torchvision==0.20.1 torchaudio==2.5.1
+pip install -e .
+pip install sam2
+pip install matplotlib
+```
+## Inference
+```bash
+python inference_scripts/infer.py
+```
+The default question is:
+> "the unusual object in the image."
+The model's thinking process is printed to the command line, and the predicted mask is saved in the **inference_scripts** folder. You can also provide your own image path and question text:
+```bash
+python inference_scripts/infer.py --image_path "your_image_path" --text "your question text"
 ```

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/gpfs/yuqiliu/easyr1_workdir/17_run_qwen2_5_vl_7b_refcocog_add_boxl1_kl5e-3_lr1e-6_strict_format_n16/global_step_200/actor/huggingface",
   "architectures": [
     "Qwen2_5_VLForConditionalGeneration"
   ],

 {
+  "_name_or_path": "/gpfs/yuqiliu/easyr1_workdir/22_run_qwen2_5_vl_7b_refcocog_add_boxl1_kl1e-2_lr1e-6_strict_format_n8/global_step_562/actor/huggingface",
   "architectures": [
     "Qwen2_5_VLForConditionalGeneration"
   ],

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:02189a5030533563cb97d46618c6084d7e128be0295c0f5f772d6ce3c68e7e49
-size 4871753400

 version https://git-lfs.github.com/spec/v1
+oid sha256:38c48425cee36ddfd4fbbc0b2993f36f06fa4ac8e460c1b79be0b59efc953fdd
+size 4888372856

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:29462384d6a68a2a4ffa78f3428ac8f54a135b55dbc423df7b9544f376fa5d4d
-size 4914744112

 version https://git-lfs.github.com/spec/v1
+oid sha256:139ba86b1b9750588060df19471bbcaf4735933e90e98c0433bd7d965397f591
+size 4930885376

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a6dd4184e10f0ec424ce8c316636e0fcc1c219f2e88cd8df3054d0ec135e68a2
-size 4932899656

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d2fd346eb88c8164a9c4c34fef43aa15d9b913ae1f21d2c1d408ccd487fa992
+size 4490074192

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:97fa285dd3928ef072ce48012fe78927ba2fcf6f70d02cd397c9f19fcc2933d7
-size 1865017328

 version https://git-lfs.github.com/spec/v1
+oid sha256:1d33376846110acadfe1735ebd6309a20235a365289a2b599b75a37c9d2a51ef
+size 2275082104

model.safetensors.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff