Update README.md
Browse files
README.md
CHANGED
|
@@ -18,7 +18,7 @@ def _get_qwen3_prompt_embeds(...):
|
|
| 18 |
...
|
| 19 |
image_features = vision_model.get_image_features(image_path)
|
| 20 |
output = text_encoder(
|
| 21 |
-
|
| 22 |
attention_mask=attention_mask,
|
| 23 |
output_hidden_states=True,
|
| 24 |
use_cache=False,
|
|
@@ -37,3 +37,13 @@ pipeline = Flux2KleinPipeline.from_pretrained(flux2_path, torch_dtype=torch.bflo
|
|
| 37 |
- 2510.17800
|
| 38 |
- 2510.18279
|
| 39 |
- 2601.14251
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
...
|
| 19 |
image_features = vision_model.get_image_features(image_path)
|
| 20 |
output = text_encoder(
|
| 21 |
+
inputs_embeds=embedder(image_features),
|
| 22 |
attention_mask=attention_mask,
|
| 23 |
output_hidden_states=True,
|
| 24 |
use_cache=False,
|
|
|
|
| 37 |
- 2510.17800
|
| 38 |
- 2510.18279
|
| 39 |
- 2601.14251
|
| 40 |
+
|
| 41 |
+
## Datasets
|
| 42 |
+
|
| 43 |
+
- artbench-pd-256x256
|
| 44 |
+
- anime-art-multicaptions (multicharacter interactions)
|
| 45 |
+
- laion
|
| 46 |
+
- spatial-caption
|
| 47 |
+
- spright-coco
|
| 48 |
+
- z-image-ethnicity-test
|
| 49 |
+
- benchmarks from the Qwen-Image Technical Report
|