Update README.md
Browse files
README.md
CHANGED
|
@@ -79,8 +79,8 @@ from transformers import Pix2StructForConditionalGeneration, Pix2StructProcessor
|
|
| 79 |
url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
| 80 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 81 |
|
| 82 |
-
model = Pix2StructForConditionalGeneration.from_pretrained("
|
| 83 |
-
processor = Pix2StructProcessor.from_pretrained("
|
| 84 |
|
| 85 |
# image only
|
| 86 |
inputs = processor(images=image, return_tensors="pt")
|
|
@@ -101,8 +101,8 @@ from transformers import Pix2StructForConditionalGeneration, Pix2StructProcessor
|
|
| 101 |
url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
| 102 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 103 |
|
| 104 |
-
model = Pix2StructForConditionalGeneration.from_pretrained("
|
| 105 |
-
processor = Pix2StructProcessor.from_pretrained("
|
| 106 |
|
| 107 |
# image only
|
| 108 |
inputs = processor(images=image, return_tensors="pt").to("cuda")
|
|
@@ -125,8 +125,8 @@ from transformers import Pix2StructForConditionalGeneration, Pix2StructProcessor
|
|
| 125 |
url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
| 126 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 127 |
|
| 128 |
-
model = Pix2StructForConditionalGeneration.from_pretrained("
|
| 129 |
-
processor = Pix2StructProcessor.from_pretrained("
|
| 130 |
|
| 131 |
# image only
|
| 132 |
inputs = processor(images=image, return_tensors="pt").to("cuda", torch.bfloat16)
|
|
@@ -156,8 +156,8 @@ url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
|
| 156 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 157 |
text = "A picture of"
|
| 158 |
|
| 159 |
-
model = Pix2StructForConditionalGeneration.from_pretrained("
|
| 160 |
-
processor = Pix2StructProcessor.from_pretrained("
|
| 161 |
|
| 162 |
# image and text prompt
|
| 163 |
inputs = processor(images=image, text=text, return_tensors="pt")
|
|
|
|
| 79 |
url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
| 80 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 81 |
|
| 82 |
+
model = Pix2StructForConditionalGeneration.from_pretrained("google/pix2struct-textcaps-base")
|
| 83 |
+
processor = Pix2StructProcessor.from_pretrained("google/pix2struct-textcaps-base")
|
| 84 |
|
| 85 |
# image only
|
| 86 |
inputs = processor(images=image, return_tensors="pt")
|
|
|
|
| 101 |
url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
| 102 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 103 |
|
| 104 |
+
model = Pix2StructForConditionalGeneration.from_pretrained("google/pix2struct-textcaps-base").to("cuda")
|
| 105 |
+
processor = Pix2StructProcessor.from_pretrained("google/pix2struct-textcaps-base")
|
| 106 |
|
| 107 |
# image only
|
| 108 |
inputs = processor(images=image, return_tensors="pt").to("cuda")
|
|
|
|
| 125 |
url = "https://www.ilankelman.org/stopsigns/australia.jpg"
|
| 126 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 127 |
|
| 128 |
+
model = Pix2StructForConditionalGeneration.from_pretrained("google/pix2struct-textcaps-base", torch_dtype=torch.bfloat16).to("cuda")
|
| 129 |
+
processor = Pix2StructProcessor.from_pretrained("google/pix2struct-textcaps-base")
|
| 130 |
|
| 131 |
# image only
|
| 132 |
inputs = processor(images=image, return_tensors="pt").to("cuda", torch.bfloat16)
|
|
|
|
| 156 |
image = Image.open(requests.get(url, stream=True).raw)
|
| 157 |
text = "A picture of"
|
| 158 |
|
| 159 |
+
model = Pix2StructForConditionalGeneration.from_pretrained("google/pix2struct-textcaps-base")
|
| 160 |
+
processor = Pix2StructProcessor.from_pretrained("google/pix2struct-textcaps-base")
|
| 161 |
|
| 162 |
# image and text prompt
|
| 163 |
inputs = processor(images=image, text=text, return_tensors="pt")
|