codeShare committed on
Commit
ff3a93d
·
verified ·
1 Parent(s): fdf075a

Upload SDNQ quantized Klein9B DarkBeast transformer

Browse files
Files changed (2) hide show
  1. config.json +74 -0
  2. diffusion_pytorch_model.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "Flux2Transformer2DModel",
3
+ "_diffusers_version": "0.37.1",
4
+ "_name_or_path": "/content/unquant_transformer",
5
+ "attention_head_dim": 128,
6
+ "axes_dims_rope": [
7
+ 32,
8
+ 32,
9
+ 32,
10
+ 32
11
+ ],
12
+ "eps": 1e-06,
13
+ "guidance_embeds": false,
14
+ "in_channels": 128,
15
+ "joint_attention_dim": 12288,
16
+ "mlp_ratio": 3.0,
17
+ "num_attention_heads": 32,
18
+ "num_layers": 8,
19
+ "num_single_layers": 24,
20
+ "out_channels": null,
21
+ "patch_size": 1,
22
+ "quantization_config": {
23
+ "add_skip_keys": true,
24
+ "dequantize_fp32": true,
25
+ "dynamic_loss_threshold": 0.01,
26
+ "group_size": 0,
27
+ "is_integer": true,
28
+ "is_training": false,
29
+ "modules_dtype_dict": {
30
+ "int8": [
31
+ "context_embedder",
32
+ "x_embedder",
33
+ "proj_out",
34
+ "norm_out"
35
+ ]
36
+ },
37
+ "modules_quant_config": {},
38
+ "modules_to_not_convert": [
39
+ "double_stream_modulation_txt",
40
+ "time_guidance_embed",
41
+ "context_embedder",
42
+ "norm_k",
43
+ "norm_q",
44
+ "proj_out",
45
+ "x_embedder",
46
+ "norm_added_k",
47
+ ".proj_out",
48
+ "norm_out",
49
+ "single_stream_modulation",
50
+ "double_stream_modulation_img",
51
+ "norm_added_q"
52
+ ],
53
+ "non_blocking": false,
54
+ "quant_conv": false,
55
+ "quant_embedding": false,
56
+ "quant_method": "sdnq",
57
+ "quantization_device": "cuda",
58
+ "quantized_matmul_dtype": null,
59
+ "return_device": "cpu",
60
+ "sdnq_version": "0.1.8",
61
+ "svd_rank": 32,
62
+ "svd_steps": 32,
63
+ "use_dynamic_quantization": true,
64
+ "use_grad_ckpt": true,
65
+ "use_quantized_matmul": true,
66
+ "use_quantized_matmul_conv": false,
67
+ "use_static_quantization": true,
68
+ "use_stochastic_rounding": false,
69
+ "use_svd": true,
70
+ "weights_dtype": "uint4"
71
+ },
72
+ "rope_theta": 2000,
73
+ "timestep_guidance_channels": 256
74
+ }
diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc8c699a5e32ce607d349637a65a179e47e0221943af29104d21913df6f71e0b
3
+ size 9078610304