Buckets:
| import{s as se,n as ie,o as oe}from"../chunks/scheduler.182ea377.js";import{S as pe,i as de,g as i,s as a,r as U,A as re,h as o,f as n,c as s,j as ne,u as _,x as Z,k as le,y as me,a as l,v as $,d as j,t as J,w as v}from"../chunks/index.abf12888.js";import{C as P}from"../chunks/CodeBlock.57fe6e13.js";import{H as ae,E as fe}from"../chunks/EditOnGithub.9b8e78e4.js";function ue(Y){let p,W,k,G,d,V,r,F="Many diffusion systems share the same components, allowing you to adapt a pretrained model for one task to an entirely different task.",B,m,q='This guide will show you how to adapt a pretrained text-to-image model for inpainting by initializing and modifying the architecture of a pretrained <a href="/docs/diffusers/v0.28.2/en/api/models/unet2d-cond#diffusers.UNet2DConditionModel">UNet2DConditionModel</a>.',N,f,X,u,A='A <a href="/docs/diffusers/v0.28.2/en/api/models/unet2d-cond#diffusers.UNet2DConditionModel">UNet2DConditionModel</a> by default accepts 4 channels in the <a href="https://huggingface.co/docs/diffusers/v0.16.0/en/api/models#diffusers.UNet2DConditionModel.in_channels" rel="nofollow">input sample</a>. For example, load a pretrained text-to-image model like <a href="https://huggingface.co/runwayml/stable-diffusion-v1-5" rel="nofollow"><code>runwayml/stable-diffusion-v1-5</code></a> and take a look at the number of <code>in_channels</code>:',x,c,Q,h,K='Inpainting requires 9 channels in the input sample. You can check this value in a pretrained inpainting model like <a href="https://huggingface.co/runwayml/stable-diffusion-inpainting" rel="nofollow"><code>runwayml/stable-diffusion-inpainting</code></a>:',I,M,R,y,O="To adapt your text-to-image model for inpainting, you’ll need to change the number of <code>in_channels</code> from 4 to 9.",S,b,ee='Initialize a <a href="/docs/diffusers/v0.28.2/en/api/models/unet2d-cond#diffusers.UNet2DConditionModel">UNet2DConditionModel</a> with the pretrained text-to-image model weights, and change <code>in_channels</code> to 9. Changing the number of <code>in_channels</code> means you need to set <code>ignore_mismatched_sizes=True</code> and <code>low_cpu_mem_usage=False</code> to avoid a size mismatch error because the shape is different now.',E,w,H,g,te="The pretrained weights of the other components from the text-to-image model are initialized from their checkpoints, but the input channel weights (<code>conv_in.weight</code>) of the <code>unet</code> are randomly initialized. It is important to finetune the model for inpainting because otherwise the model returns noise.",z,T,D,C,L;return d=new ae({props:{title:"Adapt a model to a new task",local:"adapt-a-model-to-a-new-task",headingTag:"h1"}}),f=new ae({props:{title:"Configure UNet2DConditionModel parameters",local:"configure-unet2dconditionmodel-parameters",headingTag:"h2"}}),c=new P({props:{code:"ZnJvbSUyMGRpZmZ1c2VycyUyMGltcG9ydCUyMFN0YWJsZURpZmZ1c2lvblBpcGVsaW5lJTBBJTBBcGlwZWxpbmUlMjAlM0QlMjBTdGFibGVEaWZmdXNpb25QaXBlbGluZS5mcm9tX3ByZXRyYWluZWQoJTIycnVud2F5bWwlMkZzdGFibGUtZGlmZnVzaW9uLXYxLTUlMjIlMkMlMjB1c2Vfc2FmZXRlbnNvcnMlM0RUcnVlKSUwQXBpcGVsaW5lLnVuZXQuY29uZmlnJTVCJTIyaW5fY2hhbm5lbHMlMjIlNUQlMEE0",highlighted:`<span class="hljs-keyword">from</span> diffusers <span class="hljs-keyword">import</span> StableDiffusionPipeline | |
| pipeline = StableDiffusionPipeline.from_pretrained(<span class="hljs-string">"runwayml/stable-diffusion-v1-5"</span>, use_safetensors=<span class="hljs-literal">True</span>) | |
| pipeline.unet.config[<span class="hljs-string">"in_channels"</span>] | |
| <span class="hljs-number">4</span>`,wrap:!1}}),M=new P({props:{code:"ZnJvbSUyMGRpZmZ1c2VycyUyMGltcG9ydCUyMFN0YWJsZURpZmZ1c2lvblBpcGVsaW5lJTBBJTBBcGlwZWxpbmUlMjAlM0QlMjBTdGFibGVEaWZmdXNpb25QaXBlbGluZS5mcm9tX3ByZXRyYWluZWQoJTIycnVud2F5bWwlMkZzdGFibGUtZGlmZnVzaW9uLWlucGFpbnRpbmclMjIlMkMlMjB1c2Vfc2FmZXRlbnNvcnMlM0RUcnVlKSUwQXBpcGVsaW5lLnVuZXQuY29uZmlnJTVCJTIyaW5fY2hhbm5lbHMlMjIlNUQlMEE5",highlighted:`<span class="hljs-keyword">from</span> diffusers <span class="hljs-keyword">import</span> StableDiffusionPipeline | |
| pipeline = StableDiffusionPipeline.from_pretrained(<span class="hljs-string">"runwayml/stable-diffusion-inpainting"</span>, use_safetensors=<span class="hljs-literal">True</span>) | |
| pipeline.unet.config[<span class="hljs-string">"in_channels"</span>] | |
| <span class="hljs-number">9</span>`,wrap:!1}}),w=new P({props:{code:"ZnJvbSUyMGRpZmZ1c2VycyUyMGltcG9ydCUyMFVOZXQyRENvbmRpdGlvbk1vZGVsJTBBJTBBbW9kZWxfaWQlMjAlM0QlMjAlMjJydW53YXltbCUyRnN0YWJsZS1kaWZmdXNpb24tdjEtNSUyMiUwQXVuZXQlMjAlM0QlMjBVTmV0MkRDb25kaXRpb25Nb2RlbC5mcm9tX3ByZXRyYWluZWQoJTBBJTIwJTIwJTIwJTIwbW9kZWxfaWQlMkMlMEElMjAlMjAlMjAlMjBzdWJmb2xkZXIlM0QlMjJ1bmV0JTIyJTJDJTBBJTIwJTIwJTIwJTIwaW5fY2hhbm5lbHMlM0Q5JTJDJTBBJTIwJTIwJTIwJTIwbG93X2NwdV9tZW1fdXNhZ2UlM0RGYWxzZSUyQyUwQSUyMCUyMCUyMCUyMGlnbm9yZV9taXNtYXRjaGVkX3NpemVzJTNEVHJ1ZSUyQyUwQSUyMCUyMCUyMCUyMHVzZV9zYWZldGVuc29ycyUzRFRydWUlMkMlMEEp",highlighted:`<span class="hljs-keyword">from</span> diffusers <span class="hljs-keyword">import</span> UNet2DConditionModel | |
| model_id = <span class="hljs-string">"runwayml/stable-diffusion-v1-5"</span> | |
| unet = UNet2DConditionModel.from_pretrained( | |
| model_id, | |
| subfolder=<span class="hljs-string">"unet"</span>, | |
| in_channels=<span class="hljs-number">9</span>, | |
| low_cpu_mem_usage=<span class="hljs-literal">False</span>, | |
| ignore_mismatched_sizes=<span class="hljs-literal">True</span>, | |
| use_safetensors=<span class="hljs-literal">True</span>, | |
| )`,wrap:!1}}),T=new fe({props:{source:"https://github.com/huggingface/diffusers/blob/main/docs/source/en/training/adapt_a_model.md"}}),{c(){p=i("meta"),W=a(),k=i("p"),G=a(),U(d.$$.fragment),V=a(),r=i("p"),r.textContent=F,B=a(),m=i("p"),m.innerHTML=q,N=a(),U(f.$$.fragment),X=a(),u=i("p"),u.innerHTML=A,x=a(),U(c.$$.fragment),Q=a(),h=i("p"),h.innerHTML=K,I=a(),U(M.$$.fragment),R=a(),y=i("p"),y.innerHTML=O,S=a(),b=i("p"),b.innerHTML=ee,E=a(),U(w.$$.fragment),H=a(),g=i("p"),g.innerHTML=te,z=a(),U(T.$$.fragment),D=a(),C=i("p"),this.h()},l(e){const t=re("svelte-u9bgzb",document.head);p=o(t,"META",{name:!0,content:!0}),t.forEach(n),W=s(e),k=o(e,"P",{}),ne(k).forEach(n),G=s(e),_(d.$$.fragment,e),V=s(e),r=o(e,"P",{"data-svelte-h":!0}),Z(r)!=="svelte-3om45r"&&(r.textContent=F),B=s(e),m=o(e,"P",{"data-svelte-h":!0}),Z(m)!=="svelte-1xp9uqj"&&(m.innerHTML=q),N=s(e),_(f.$$.fragment,e),X=s(e),u=o(e,"P",{"data-svelte-h":!0}),Z(u)!=="svelte-1bcplok"&&(u.innerHTML=A),x=s(e),_(c.$$.fragment,e),Q=s(e),h=o(e,"P",{"data-svelte-h":!0}),Z(h)!=="svelte-ph2jy1"&&(h.innerHTML=K),I=s(e),_(M.$$.fragment,e),R=s(e),y=o(e,"P",{"data-svelte-h":!0}),Z(y)!=="svelte-15mkgo9"&&(y.innerHTML=O),S=s(e),b=o(e,"P",{"data-svelte-h":!0}),Z(b)!=="svelte-v7fif9"&&(b.innerHTML=ee),E=s(e),_(w.$$.fragment,e),H=s(e),g=o(e,"P",{"data-svelte-h":!0}),Z(g)!=="svelte-6j6lxu"&&(g.innerHTML=te),z=s(e),_(T.$$.fragment,e),D=s(e),C=o(e,"P",{}),ne(C).forEach(n),this.h()},h(){le(p,"name","hf:doc:metadata"),le(p,"content",ce)},m(e,t){me(document.head,p),l(e,W,t),l(e,k,t),l(e,G,t),$(d,e,t),l(e,V,t),l(e,r,t),l(e,B,t),l(e,m,t),l(e,N,t),$(f,e,t),l(e,X,t),l(e,u,t),l(e,x,t),$(c,e,t),l(e,Q,t),l(e,h,t),l(e,I,t),$(M,e,t),l(e,R,t),l(e,y,t),l(e,S,t),l(e,b,t),l(e,E,t),$(w,e,t),l(e,H,t),l(e,g,t),l(e,z,t),$(T,e,t),l(e,D,t),l(e,C,t),L=!0},p:ie,i(e){L||(j(d.$$.fragment,e),j(f.$$.fragment,e),j(c.$$.fragment,e),j(M.$$.fragment,e),j(w.$$.fragment,e),j(T.$$.fragment,e),L=!0)},o(e){J(d.$$.fragment,e),J(f.$$.fragment,e),J(c.$$.fragment,e),J(M.$$.fragment,e),J(w.$$.fragment,e),J(T.$$.fragment,e),L=!1},d(e){e&&(n(W),n(k),n(G),n(V),n(r),n(B),n(m),n(N),n(X),n(u),n(x),n(Q),n(h),n(I),n(R),n(y),n(S),n(b),n(E),n(H),n(g),n(z),n(D),n(C)),n(p),v(d,e),v(f,e),v(c,e),v(M,e),v(w,e),v(T,e)}}}const ce='{"title":"Adapt a model to a new task","local":"adapt-a-model-to-a-new-task","sections":[{"title":"Configure UNet2DConditionModel parameters","local":"configure-unet2dconditionmodel-parameters","sections":[],"depth":2}],"depth":1}';function he(Y){return oe(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class ge extends pe{constructor(p){super(),de(this,p,he,ue,se,{})}}export{ge as component}; | |
Xet Storage Details
- Size:
- 8.16 kB
- Xet hash:
- f2ca32eae2371a0454d3fabc7c6c83dbc37386f4729b8bae4eececee611cae42
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.