recoilme committed on Sep 15, 2025

Commit

8308d70

1 Parent(s): d2849c3

simplevae

Browse files

Files changed (21) hide show

config.json +0 -38
create.ipynb +0 -0
diffusion_pytorch_model.safetensors +0 -3
final_vae/config.json +0 -38
final_vae/diffusion_pytorch_model.safetensors +0 -3
sdxl_vae/config.json +0 -38
sdxl_vae/diffusion_pytorch_model.safetensors +0 -3
sdxs_vae/.ipynb_checkpoints/config-checkpoint.json +0 -48
sdxs_vae/config.json +0 -48
sdxs_vae/diffusion_pytorch_model.safetensors +0 -3
simple_vae_nightly/config.json +0 -38
simple_vae_nightly/diffusion_pytorch_model.safetensors +0 -3
simple_vae_nightly2/config.json +0 -38
simple_vae_nightly2/diffusion_pytorch_model.safetensors +0 -3
test.ipynb +0 -95
vae/config.json +2 -2
vae/diffusion_pytorch_model.safetensors +2 -2
wan16x_vae_nightly/config.json +0 -129
wan16x_vae_nightly/diffusion_pytorch_model.safetensors +0 -3
wan16x_vae_nightly2/config.json +0 -129
wan16x_vae_nightly2/diffusion_pytorch_model.safetensors +0 -3

config.json DELETED Viewed

@@ -1,38 +0,0 @@
-{
-  "_class_name": "AutoencoderKL",
-  "_diffusers_version": "0.35.0.dev0",
-  "_name_or_path": "simple_vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 16,
-  "latents_mean": null,
-  "latents_std": null,
-  "layers_per_block": 2,
-  "mid_block_add_attention": true,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 1024,
-  "scaling_factor": 1.0,
-  "shift_factor": 0,
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ],
-  "use_post_quant_conv": true,
-  "use_quant_conv": true
-}

create.ipynb DELETED Viewed

The diff for this file is too large to render. See raw diff

diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f5f0a20e403669e880b510514ee575a2a9cb74a1b36ab0e31fc68ef66c2173d7
-size 335311892

final_vae/config.json DELETED Viewed

@@ -1,38 +0,0 @@
-{
-  "_class_name": "AutoencoderKL",
-  "_diffusers_version": "0.34.0",
-  "_name_or_path": "sdxl_vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 4,
-  "latents_mean": null,
-  "latents_std": null,
-  "layers_per_block": 2,
-  "mid_block_add_attention": true,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 512,
-  "scaling_factor": 0.13025,
-  "shift_factor": null,
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ],
-  "use_post_quant_conv": true,
-  "use_quant_conv": true
-}

final_vae/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:00ba31cad0e49ebd19a8c62c72eef3d8e51271675f2cde0ec079aef89e44463d
-size 334643268

sdxl_vae/config.json DELETED Viewed

@@ -1,38 +0,0 @@
-{
-  "_class_name": "AutoencoderKL",
-  "_diffusers_version": "0.34.0",
-  "_name_or_path": "sdxl_vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 4,
-  "latents_mean": null,
-  "latents_std": null,
-  "layers_per_block": 2,
-  "mid_block_add_attention": true,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 512,
-  "scaling_factor": 0.13025,
-  "shift_factor": null,
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ],
-  "use_post_quant_conv": true,
-  "use_quant_conv": true
-}

sdxl_vae/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2fd955b1cc451f2cafb58a29e1e0a07589e34d364ddf3d93ccd21a16ff8d3e5c
-size 334643268

sdxs_vae/.ipynb_checkpoints/config-checkpoint.json DELETED Viewed

@@ -1,48 +0,0 @@
-{
-  "_class_name": "AsymmetricAutoencoderKL",
-  "_diffusers_version": "0.34.0",
-  "_name_or_path": "vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    768,
-    768
-  ],
-  "down_block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 16,
-  "layers_per_down_block": 2,
-  "layers_per_up_block": 2,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 1024,
-  "scaling_factor": 1,
-  "up_block_out_channels": [
-    128,
-    256,
-    512,
-    768,
-    768
-  ],
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ]
-}

sdxs_vae/config.json DELETED Viewed

@@ -1,48 +0,0 @@
-{
-  "_class_name": "AsymmetricAutoencoderKL",
-  "_diffusers_version": "0.34.0",
-  "_name_or_path": "vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    768,
-    768
-  ],
-  "down_block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 16,
-  "layers_per_down_block": 2,
-  "layers_per_up_block": 2,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 1024,
-  "scaling_factor": 1,
-  "up_block_out_channels": [
-    128,
-    256,
-    512,
-    768,
-    768
-  ],
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ]
-}

sdxs_vae/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3c42f2525cd74fedf496b0d3bf2c1c2ec6eee59250d934c4d74a0b449ad2b627
-size 698002772

simple_vae_nightly/config.json DELETED Viewed

@@ -1,38 +0,0 @@
-{
-  "_class_name": "AutoencoderKL",
-  "_diffusers_version": "0.35.0.dev0",
-  "_name_or_path": "simple_vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 16,
-  "latents_mean": null,
-  "latents_std": null,
-  "layers_per_block": 2,
-  "mid_block_add_attention": true,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 1024,
-  "scaling_factor": 1.0,
-  "shift_factor": 0,
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ],
-  "use_post_quant_conv": true,
-  "use_quant_conv": true
-}

simple_vae_nightly/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b39620d0953839362425f03674e6c3e37f03d20be3fbd7f281baea4dfc336a40
-size 335311892

simple_vae_nightly2/config.json DELETED Viewed

@@ -1,38 +0,0 @@
-{
-  "_class_name": "AutoencoderKL",
-  "_diffusers_version": "0.35.0.dev0",
-  "_name_or_path": "simple_vae",
-  "act_fn": "silu",
-  "block_out_channels": [
-    128,
-    256,
-    512,
-    512
-  ],
-  "down_block_types": [
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D",
-    "DownEncoderBlock2D"
-  ],
-  "force_upcast": false,
-  "in_channels": 3,
-  "latent_channels": 16,
-  "latents_mean": null,
-  "latents_std": null,
-  "layers_per_block": 2,
-  "mid_block_add_attention": true,
-  "norm_num_groups": 32,
-  "out_channels": 3,
-  "sample_size": 1024,
-  "scaling_factor": 1.0,
-  "shift_factor": 0,
-  "up_block_types": [
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D",
-    "UpDecoderBlock2D"
-  ],
-  "use_post_quant_conv": true,
-  "use_quant_conv": true
-}

simple_vae_nightly2/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:edf84f6e6e4499cdf73c63d2442a923ee46bfea7b24e4bf04910cf9dd8c1f652
-size 335311892

test.ipynb DELETED Viewed

@@ -1,95 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "code",
-   "execution_count": 1,
-   "id": "4f62bfd9-5396-48e2-aac7-bdf639cab345",
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "The config attributes {'block_out_channels': [128, 256, 512, 768, 768], 'force_upcast': False} were passed to AsymmetricAutoencoderKL, but are not expected and will be ignored. Please verify your config.json configuration file.\n"
-     ]
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "ok\n"
-     ]
-    }
-   ],
-   "source": [
-    "import torch\n",
-    "\n",
-    "from torchvision import transforms, utils\n",
-    "\n",
-    "import diffusers\n",
-    "from diffusers import AsymmetricAutoencoderKL\n",
-    "\n",
-    "from diffusers.utils import load_image\n",
-    "\n",
-    "def crop_image_to_nearest_divisible_by_8(img):\n",
-    "    # Check if the image height and width are divisible by 8\n",
-    "    if img.shape[1] % 8 == 0 and img.shape[2] % 8 == 0:\n",
-    "        return img\n",
-    "    else:\n",
-    "        # Calculate the closest lower resolution divisible by 8\n",
-    "        new_height = img.shape[1] - (img.shape[1] % 8)\n",
-    "        new_width = img.shape[2] - (img.shape[2] % 8)\n",
-    "        \n",
-    "        # Use CenterCrop to crop the image\n",
-    "        transform = transforms.CenterCrop((new_height, new_width), interpolation=transforms.InterpolationMode.BILINEAR)\n",
-    "        img = transform(img).to(torch.float32).clamp(-1, 1)\n",
-    "        \n",
-    "        return img\n",
-    "        \n",
-    "to_tensor = transforms.ToTensor()\n",
-    "\n",
-    "device = \"cuda\"\n",
-    "dtype=torch.float16\n",
-    "vae = AsymmetricAutoencoderKL.from_pretrained(\"vae\",torch_dtype=dtype).to(device).eval()\n",
-    "\n",
-    "image = load_image(\"generated.png\")\n",
-    "\n",
-    "image = crop_image_to_nearest_divisible_by_8(to_tensor(image)).unsqueeze(0).to(device,dtype=dtype)\n",
-    "\n",
-    "upscaled_image = vae(image).sample\n",
-    "# Save the reconstructed image\n",
-    "utils.save_image(upscaled_image, \"test.png\")\n",
-    "print('ok')"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7e3ad326-c410-44b6-a738-15b7f7e15075",
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.6"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}

vae/config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "_class_name": "AutoencoderKL",
-  "_diffusers_version": "0.35.0.dev0",
-  "_name_or_path": "simple_vae",
   "act_fn": "silu",
   "block_out_channels": [
     128,

 {
   "_class_name": "AutoencoderKL",
+  "_diffusers_version": "0.35.1",
+  "_name_or_path": "AiArtLab/simplevae",
   "act_fn": "silu",
   "block_out_channels": [
     128,

vae/diffusion_pytorch_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:744c01d5b33fcca51ca9839bb0afb14cce48a13e922d27d8b73ed92c5733dd0c
-size 335311892

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ff1aa1cce9dcf003c7eb23548fdb62101fe9bdeedf30aa4a897b91a6ef13f93
+size 167669678

wan16x_vae_nightly/config.json DELETED Viewed

@@ -1,129 +0,0 @@
-{
-  "_class_name": "AutoencoderKLWan",
-  "_diffusers_version": "0.35.1",
-  "_name_or_path": "wan16x_vae",
-  "attn_scales": [],
-  "base_dim": 160,
-  "clip_output": false,
-  "decoder_base_dim": 256,
-  "dim_mult": [
-    1,
-    2,
-    4,
-    4
-  ],
-  "dropout": 0.0,
-  "in_channels": 12,
-  "is_residual": true,
-  "latents_mean": [
-    -0.2289,
-    -0.0052,
-    -0.1323,
-    -0.2339,
-    -0.2799,
-    0.0174,
-    0.1838,
-    0.1557,
-    -0.1382,
-    0.0542,
-    0.2813,
-    0.0891,
-    0.157,
-    -0.0098,
-    0.0375,
-    -0.1825,
-    -0.2246,
-    -0.1207,
-    -0.0698,
-    0.5109,
-    0.2665,
-    -0.2108,
-    -0.2158,
-    0.2502,
-    -0.2055,
-    -0.0322,
-    0.1109,
-    0.1567,
-    -0.0729,
-    0.0899,
-    -0.2799,
-    -0.123,
-    -0.0313,
-    -0.1649,
-    0.0117,
-    0.0723,
-    -0.2839,
-    -0.2083,
-    -0.052,
-    0.3748,
-    0.0152,
-    0.1957,
-    0.1433,
-    -0.2944,
-    0.3573,
-    -0.0548,
-    -0.1681,
-    -0.0667
-  ],
-  "latents_std": [
-    0.4765,
-    1.0364,
-    0.4514,
-    1.1677,
-    0.5313,
-    0.499,
-    0.4818,
-    0.5013,
-    0.8158,
-    1.0344,
-    0.5894,
-    1.0901,
-    0.6885,
-    0.6165,
-    0.8454,
-    0.4978,
-    0.5759,
-    0.3523,
-    0.7135,
-    0.6804,
-    0.5833,
-    1.4146,
-    0.8986,
-    0.5659,
-    0.7069,
-    0.5338,
-    0.4889,
-    0.4917,
-    0.4069,
-    0.4999,
-    0.6866,
-    0.4093,
-    0.5709,
-    0.6065,
-    0.6415,
-    0.4944,
-    0.5726,
-    1.2042,
-    0.5458,
-    1.6887,
-    0.3971,
-    1.06,
-    0.3943,
-    0.5537,
-    0.5444,
-    0.4089,
-    0.7468,
-    0.7744
-  ],
-  "num_res_blocks": 2,
-  "out_channels": 12,
-  "patch_size": 2,
-  "scale_factor_spatial": 16,
-  "scale_factor_temporal": 4,
-  "temperal_downsample": [
-    false,
-    true,
-    true
-  ],
-  "z_dim": 48
-}

wan16x_vae_nightly/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:5ba8f8440d69d3369abd2a6e7e76aea92a8c4014bf718bb23bb86223a157ca46
-size 2818777808

wan16x_vae_nightly2/config.json DELETED Viewed

@@ -1,129 +0,0 @@
-{
-  "_class_name": "AutoencoderKLWan",
-  "_diffusers_version": "0.35.1",
-  "_name_or_path": "wan16x_vae",
-  "attn_scales": [],
-  "base_dim": 160,
-  "clip_output": false,
-  "decoder_base_dim": 256,
-  "dim_mult": [
-    1,
-    2,
-    4,
-    4
-  ],
-  "dropout": 0.0,
-  "in_channels": 12,
-  "is_residual": true,
-  "latents_mean": [
-    -0.2289,
-    -0.0052,
-    -0.1323,
-    -0.2339,
-    -0.2799,
-    0.0174,
-    0.1838,
-    0.1557,
-    -0.1382,
-    0.0542,
-    0.2813,
-    0.0891,
-    0.157,
-    -0.0098,
-    0.0375,
-    -0.1825,
-    -0.2246,
-    -0.1207,
-    -0.0698,
-    0.5109,
-    0.2665,
-    -0.2108,
-    -0.2158,
-    0.2502,
-    -0.2055,
-    -0.0322,
-    0.1109,
-    0.1567,
-    -0.0729,
-    0.0899,
-    -0.2799,
-    -0.123,
-    -0.0313,
-    -0.1649,
-    0.0117,
-    0.0723,
-    -0.2839,
-    -0.2083,
-    -0.052,
-    0.3748,
-    0.0152,
-    0.1957,
-    0.1433,
-    -0.2944,
-    0.3573,
-    -0.0548,
-    -0.1681,
-    -0.0667
-  ],
-  "latents_std": [
-    0.4765,
-    1.0364,
-    0.4514,
-    1.1677,
-    0.5313,
-    0.499,
-    0.4818,
-    0.5013,
-    0.8158,
-    1.0344,
-    0.5894,
-    1.0901,
-    0.6885,
-    0.6165,
-    0.8454,
-    0.4978,
-    0.5759,
-    0.3523,
-    0.7135,
-    0.6804,
-    0.5833,
-    1.4146,
-    0.8986,
-    0.5659,
-    0.7069,
-    0.5338,
-    0.4889,
-    0.4917,
-    0.4069,
-    0.4999,
-    0.6866,
-    0.4093,
-    0.5709,
-    0.6065,
-    0.6415,
-    0.4944,
-    0.5726,
-    1.2042,
-    0.5458,
-    1.6887,
-    0.3971,
-    1.06,
-    0.3943,
-    0.5537,
-    0.5444,
-    0.4089,
-    0.7468,
-    0.7744
-  ],
-  "num_res_blocks": 2,
-  "out_channels": 12,
-  "patch_size": 2,
-  "scale_factor_spatial": 16,
-  "scale_factor_temporal": 4,
-  "temperal_downsample": [
-    false,
-    true,
-    true
-  ],
-  "z_dim": 48
-}

wan16x_vae_nightly2/diffusion_pytorch_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a97241a505fc54a972fef91bb8006dee59116fa64de7c81f6f54a86ec9a04718
-size 2818777808