File size: 4,730 Bytes
6738b2c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
{
  "validation_date": "2026-06-04",
  "machine": "Apple M5 Max, 128 GiB unified memory",
  "profile": {
    "prompt": "A short cinematic video of a glowing orange glass sphere floating above calm teal water, soft reflections, gentle camera movement",
    "negative_prompt": "",
    "width": 1280,
    "height": 704,
    "frames": 17,
    "steps": 20,
    "guidance": 5,
    "fps": 24,
    "seed": 321
  },
  "layouts": {
    "base_source": {
      "repo": "Wan-AI/Wan2.2-TI2V-5B-Diffusers",
      "storage_gib": 31.85,
      "mp4": "base-source.mp4",
      "total_seconds": 216.15181183815002,
      "generation_seconds": 215.164,
      "physical_peak_gib": 102.67981120198965,
      "rss_peak_gib": 13.703689575195312,
      "resident_peak_gib": 13.702316284179688,
      "mlx_peak_gib": 58.507674764841795,
      "mlx_active_after_generate_gib": 10.348156608641148,
      "mlx_cache_after_generate_gib": 0.48403943702578545,
      "logical_model_gib": 10.62639182060957,
      "logical_transformer_gib": 9.313806891441345,
      "logical_vae_gib": 1.3125849291682243,
      "model_bits": null,
      "health": {
        "source": "validation_outputs/ti2v_memory_profile_2026_06_04/base_source.mp4",
        "frame_count": 17,
        "width": 1280,
        "height": 704,
        "fps": 24.0,
        "luma_min": 7.228399753570557,
        "luma_max": 246.07899475097656,
        "luma_mean": 174.08145500631895,
        "mean_temporal_delta": 0.7045322582125664
      }
    },
    "prepared_bf16": {
      "repo": "AbstractFramework/wan2.2-ti2v-5b-diffusers-bf16",
      "storage_gib": 21.22,
      "mp4": "prepared-bf16.mp4",
      "total_seconds": 261.56354999542236,
      "generation_seconds": 260.648,
      "physical_peak_gib": 102.583978459239,
      "rss_peak_gib": 14.515884399414062,
      "resident_peak_gib": 14.515884399414062,
      "mlx_peak_gib": 58.472518514841795,
      "mlx_active_after_generate_gib": 10.348156608641148,
      "mlx_cache_after_generate_gib": 0.48403943702578545,
      "logical_model_gib": 10.62639182060957,
      "logical_transformer_gib": 9.313806891441345,
      "logical_vae_gib": 1.3125849291682243,
      "model_bits": null,
      "health": {
        "source": "validation_outputs/ti2v_memory_profile_2026_06_04/prepared_bf16.mp4",
        "frame_count": 17,
        "width": 1280,
        "height": 704,
        "fps": 24.0,
        "luma_min": 7.228399753570557,
        "luma_max": 246.07899475097656,
        "luma_mean": 174.08145500631895,
        "mean_temporal_delta": 0.7045322582125664
      }
    },
    "mixed_q8_bf16": {
      "repo": "AbstractFramework/wan2.2-ti2v-5b-diffusers-8bit",
      "storage_gib": 16.86,
      "mp4": "mixed-q8-bf16.mp4",
      "total_seconds": 243.38612413406372,
      "generation_seconds": 242.664,
      "physical_peak_gib": 103.74846588075161,
      "rss_peak_gib": 13.800796508789062,
      "resident_peak_gib": 13.79901123046875,
      "mlx_peak_gib": 54.187850546091795,
      "mlx_active_after_generate_gib": 6.063488639891148,
      "mlx_cache_after_generate_gib": 0.48403943702578545,
      "logical_model_gib": 6.3417238518595695,
      "logical_transformer_gib": 5.029138922691345,
      "logical_vae_gib": 1.3125849291682243,
      "model_bits": 8,
      "health": {
        "source": "validation_outputs/ti2v_memory_profile_2026_06_04/mixed_q8_bf16.mp4",
        "frame_count": 17,
        "width": 1280,
        "height": 704,
        "fps": 24.0,
        "luma_min": 7.866199493408203,
        "luma_max": 246.94140625,
        "luma_mean": 174.77739491182214,
        "mean_temporal_delta": 0.6711972616612911
      }
    }
  },
  "comparisons": {
    "base_vs_prepared_bf16": {
      "frame_count": 17,
      "byte_identical_decoded_frames": true,
      "mean_frame_mae": 0.0,
      "max_frame_mae": 0.0,
      "max_abs_channel_delta": 0
    },
    "base_vs_mixed_q8_bf16": {
      "frame_count": 17,
      "byte_identical_decoded_frames": false,
      "mean_frame_mae": 1.6606264709363858,
      "max_frame_mae": 1.7536328864820077,
      "max_abs_channel_delta": 133
    },
    "prepared_bf16_vs_mixed_q8_bf16": {
      "frame_count": 17,
      "byte_identical_decoded_frames": false,
      "mean_frame_mae": 1.6606264709363858,
      "max_frame_mae": 1.7536328864820077,
      "max_abs_channel_delta": 133
    }
  },
  "interpretation": {
    "prepared_bf16": "Storage/download reduction only for this profile; MLX-Gen already casts upstream Wan transformer and VAE weights to BF16 at runtime.",
    "mixed_q8_bf16": "Reduces storage, logical model bytes, active MLX bytes, and MLX allocator peak. This profile did not reduce full-process Darwin physical peak because non-model transient memory dominated the run."
  }
}