Update app.py
Browse files
app.py
CHANGED
|
@@ -4,36 +4,16 @@ from diffusers import Flux2Pipeline
|
|
| 4 |
|
| 5 |
pipe = Flux2Pipeline.from_pretrained(
|
| 6 |
"black-forest-labs/FLUX.2-klein-4B",
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
scheduler=None,
|
| 10 |
-
safety_checker=None,
|
| 11 |
-
feature_extractor=None,
|
| 12 |
)
|
| 13 |
|
| 14 |
-
tokenizer = pipe.tokenizer
|
| 15 |
-
text_encoder = pipe.text_encoder
|
| 16 |
-
|
| 17 |
def encode_text(prompt: str):
|
| 18 |
-
inputs = tokenizer(
|
| 19 |
-
prompt,
|
| 20 |
-
return_tensors="pt",
|
| 21 |
-
padding=True,
|
| 22 |
-
truncation=True,
|
| 23 |
-
max_length=512,
|
| 24 |
-
)
|
| 25 |
-
|
| 26 |
with torch.inference_mode():
|
| 27 |
-
|
| 28 |
-
**inputs,
|
| 29 |
-
output_hidden_states=True,
|
| 30 |
-
use_cache=False,
|
| 31 |
-
)
|
| 32 |
-
|
| 33 |
-
embeds = outputs.hidden_states[-1] # [B, L, 4096]
|
| 34 |
|
| 35 |
-
torch.save(
|
| 36 |
-
return f"shape={tuple(
|
| 37 |
|
| 38 |
demo = gr.Interface(
|
| 39 |
fn=encode_text,
|
|
|
|
| 4 |
|
| 5 |
pipe = Flux2Pipeline.from_pretrained(
|
| 6 |
"black-forest-labs/FLUX.2-klein-4B",
|
| 7 |
+
torch_dtype=torch.float32,
|
| 8 |
+
low_cpu_mem_usage=True,
|
|
|
|
|
|
|
|
|
|
| 9 |
)
|
| 10 |
|
|
|
|
|
|
|
|
|
|
| 11 |
def encode_text(prompt: str):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
with torch.inference_mode():
|
| 13 |
+
prompt_embeds = pipe.encode_prompt(prompt) # [B, L, 2560] dans ton cas
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
|
| 15 |
+
torch.save(prompt_embeds.cpu(), "embeds.pt")
|
| 16 |
+
return f"shape={tuple(prompt_embeds.shape)}", "embeds.pt"
|
| 17 |
|
| 18 |
demo = gr.Interface(
|
| 19 |
fn=encode_text,
|