Update README.md
Browse files
README.md
CHANGED
|
@@ -68,14 +68,16 @@ pip install optimum-quanto
|
|
| 68 |
2. Run the script:
|
| 69 |
```python
|
| 70 |
import torch
|
| 71 |
-
from safetensors.torch import save_file
|
| 72 |
|
| 73 |
-
from diffusers import FluxTransformer2DModel
|
| 74 |
-
from optimum.quanto import freeze, qfloat8, quantize
|
|
|
|
|
|
|
|
|
|
| 75 |
|
| 76 |
transformer = FluxTransformer2DModel.from_single_file("modern-anime.safetensors", torch_dtype=torch.bfloat16)
|
| 77 |
-
quantize(transformer, weights=qfloat8)
|
| 78 |
-
freeze(transformer)
|
| 79 |
|
| 80 |
transformer.save_pretrained("transformer")
|
| 81 |
```
|
|
|
|
| 68 |
2. Run the script:
|
| 69 |
```python
|
| 70 |
import torch
|
| 71 |
+
from safetensors.torch import save_file, load_file
|
| 72 |
|
| 73 |
+
from diffusers import FluxTransformer2DModel
|
| 74 |
+
from optimum.quanto import freeze, qfloat8, quantize, QuantizedDiffusersModel
|
| 75 |
+
|
| 76 |
+
class QuantizedFlux2DModel(QuantizedDiffusersModel):
|
| 77 |
+
    base_class = FluxTransformer2DModel
|
| 78 |
|
| 79 |
transformer = FluxTransformer2DModel.from_single_file("modern-anime.safetensors", torch_dtype=torch.bfloat16)
|
| 80 |
+
transformer = QuantizedFlux2DModel.quantize(transformer, weights=qfloat8)
|
|
|
|
| 81 |
|
| 82 |
transformer.save_pretrained("transformer")
|
| 83 |
```
|