File size: 2,474 Bytes
f3d279e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
{
  "source_repo": "ideogram-ai/ideogram-4-fp8",
  "target_repo": "WaveCut/ideogram-4-sdnq-uint4",
  "quantization": {
    "weights_dtype": "uint4",
    "group_size": 0,
    "use_svd": false,
    "use_dynamic_quantization": false,
    "use_stochastic_rounding": false,
    "dequantize_fp32": false,
    "add_skip_keys": false
  },
  "components": {
    "transformer": {
      "file": "model/transformer/diffusion_pytorch_model.safetensors",
      "storage_mb": 4979.658447265625,
      "num_state_tensors": 880,
      "source_materialized_storage_mb": 17698.838134765625,
      "name": "quantize_transformer",
      "elapsed_seconds": 112.6355704489979,
      "gpu_before_mb": 561,
      "gpu_after_mb": 649,
      "gpu_peak_mb": 36525,
      "torch_peak_allocated_mb": 0.0,
      "torch_peak_reserved_mb": 0.0,
      "component": "transformer"
    },
    "unconditional_transformer": {
      "file": "model/unconditional_transformer/diffusion_pytorch_model.safetensors",
      "storage_mb": 4979.658447265625,
      "num_state_tensors": 880,
      "source_materialized_storage_mb": 17698.838134765625,
      "name": "quantize_unconditional_transformer",
      "elapsed_seconds": 108.67946223300532,
      "gpu_before_mb": 649,
      "gpu_after_mb": 649,
      "gpu_peak_mb": 36525,
      "torch_peak_allocated_mb": 0.0,
      "torch_peak_reserved_mb": 0.0,
      "component": "unconditional_transformer"
    },
    "text_encoder": {
      "storage_mb": 4097.525390625,
      "source_materialized_storage_mb": 14435.587890625,
      "num_state_tensors": 904,
      "name": "quantize_text_encoder",
      "elapsed_seconds": 102.32456034698407,
      "gpu_before_mb": 649,
      "gpu_after_mb": 649,
      "gpu_peak_mb": 24477,
      "torch_peak_allocated_mb": 0.0,
      "torch_peak_reserved_mb": 0.0,
      "component": "text_encoder"
    },
    "vae": {
      "file": "model/vae/diffusion_pytorch_model.safetensors",
      "storage_mb": 50.18652153015137,
      "num_state_tensors": 395,
      "source_materialized_storage_mb": 160.30573844909668,
      "name": "quantize_vae",
      "elapsed_seconds": 2.675335832987912,
      "gpu_before_mb": 649,
      "gpu_after_mb": 649,
      "gpu_peak_mb": 861,
      "torch_peak_allocated_mb": 0.0,
      "torch_peak_reserved_mb": 0.0,
      "component": "vae"
    }
  },
  "scaffolding": {
    "snapshot": "/root/.cache/huggingface/hub/models--ideogram-ai--ideogram-4-fp8/snapshots/ee79a7237b519f1402ceacf952f30c8a31ec5073"
  }
}