Image-Text-to-Text
Transformers
Safetensors
English
Chinese
qwen3_5
unsloth
fine tune
creative
creative writing
fiction writing
plot generation
sub-plot generation
story generation
scene continue
storytelling
fiction story
science fiction
romance
all genres
story
writing
vivid prosing
vivid writing
fiction
roleplaying
bfloat16
all use cases
conversational
| { | |
| "size": { | |
| "longest_edge": 25165824, | |
| "shortest_edge": 4096 | |
| }, | |
| "patch_size": 16, | |
| "temporal_patch_size": 2, | |
| "merge_size": 2, | |
| "image_mean": [ | |
| 0.5, | |
| 0.5, | |
| 0.5 | |
| ], | |
| "image_std": [ | |
| 0.5, | |
| 0.5, | |
| 0.5 | |
| ], | |
| "processor_class": "Qwen3VLProcessor", | |
| "video_processor_type": "Qwen3VLVideoProcessor" | |
| } |