Buckets:

rtrm's picture
download
raw
17.3 kB
import{s as Z,n as J,o as K}from"../chunks/scheduler.412302f6.js";import{S as X,i as ee,g as d,s as n,r as B,A as te,h as r,f as i,c as o,j as F,x as _,u as O,k as A,y as ie,a,v as j,d as Q,t as N,w as W}from"../chunks/index.f36f02f5.js";import{H as Y}from"../chunks/Heading.41d80af4.js";function ae(E){let l,w,x,I,s,H='<br/> <img src="https://raw.githubusercontent.com/huggingface/diffusers/77aadfee6a891ab9fcfb780f87c693f7a5beeb8e/docs/source/imgs/diffusers_library.jpg" width="400"/> <br/>',y,p,G,u,$=`🤗 Diffusers 是一个值得首选用于生成图像、音频甚至 3D 分子结构的,最先进的预训练扩散模型库。
无论您是在寻找简单的推理解决方案,还是想训练自己的扩散模型,🤗 Diffusers 这一模块化工具箱都能对其提供支持。
本库的设计更偏重于<a href="conceptual/philosophy#usability-over-performance">可用而非高性能</a>、<a href="conceptual/philosophy#simple-over-easy">简明而非简单</a>以及<a href="conceptual/philosophy#tweakable-contributorfriendly-over-abstraction">易用而非抽象</a>。`,D,g,U="本库包含三个主要组件:",T,h,R='<li>最先进的扩散管道 <a href="api/pipelines/overview">diffusion pipelines</a>,只需几行代码即可进行推理。</li> <li>可交替使用的各种噪声调度器 <a href="api/schedulers/overview">noise schedulers</a>,用于平衡生成速度和质量。</li> <li>预训练模型 <a href="api/models">models</a>,可作为构建模块,并与调度程序结合使用,来创建您自己的端到端扩散系统。</li>',M,f,V='<div class="w-full flex flex-col space-y-4 md:space-y-0 md:grid md:grid-cols-2 md:gap-y-4 md:gap-x-5"><a class="!no-underline border dark:border-gray-700 p-5 rounded-lg shadow hover:shadow-lg" href="./tutorials/tutorial_overview"><div class="w-full text-center bg-gradient-to-br from-blue-400 to-blue-500 rounded-lg py-1.5 font-semibold mb-5 text-white text-lg leading-relaxed">Tutorials</div> <p class="text-gray-700">Learn the fundamental skills you need to start generating outputs, build your own diffusion system, and train a diffusion model. We recommend starting here if you&#39;re using 🤗 Diffusers for the first time!</p></a> <a class="!no-underline border dark:border-gray-700 p-5 rounded-lg shadow hover:shadow-lg" href="./using-diffusers/loading_overview"><div class="w-full text-center bg-gradient-to-br from-indigo-400 to-indigo-500 rounded-lg py-1.5 font-semibold mb-5 text-white text-lg leading-relaxed">How-to guides</div> <p class="text-gray-700">Practical guides for helping you load pipelines, models, and schedulers. You&#39;ll also learn how to use pipelines for specific tasks, control how outputs are generated, optimize for inference speed, and different training techniques.</p></a> <a class="!no-underline border dark:border-gray-700 p-5 rounded-lg shadow hover:shadow-lg" href="./conceptual/philosophy"><div class="w-full text-center bg-gradient-to-br from-pink-400 to-pink-500 rounded-lg py-1.5 font-semibold mb-5 text-white text-lg leading-relaxed">Conceptual guides</div> <p class="text-gray-700">Understand why the library was designed the way it was, and learn more about the ethical guidelines and safety implementations for using the library.</p></a> <a class="!no-underline border dark:border-gray-700 p-5 rounded-lg shadow hover:shadow-lg" href="./api/models"><div class="w-full text-center bg-gradient-to-br from-purple-400 to-purple-500 rounded-lg py-1.5 font-semibold mb-5 text-white text-lg leading-relaxed">Reference</div> <p class="text-gray-700">Technical descriptions of how 🤗 Diffusers classes and methods work.</p></a></div>',S,c,L,m,q="下表汇总了当前所有官方支持的pipelines及其对应的论文.",C,b,z='<thead><tr><th>管道</th> <th>论文/仓库</th> <th align="center">任务</th></tr></thead> <tbody><tr><td><a href="./api/pipelines/alt_diffusion">alt_diffusion</a></td> <td><a href="https://arxiv.org/abs/2211.06679" rel="nofollow">AltCLIP: Altering the Language Encoder in CLIP for Extended Language Capabilities</a></td> <td align="center">Image-to-Image Text-Guided Generation</td></tr> <tr><td><a href="./api/pipelines/audio_diffusion">audio_diffusion</a></td> <td><a href="https://github.com/teticio/audio-diffusion.git" rel="nofollow">Audio Diffusion</a></td> <td align="center">Unconditional Audio Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/controlnet">controlnet</a></td> <td><a href="https://arxiv.org/abs/2302.05543" rel="nofollow">Adding Conditional Control to Text-to-Image Diffusion Models</a></td> <td align="center">Image-to-Image Text-Guided Generation</td></tr> <tr><td><a href="./api/pipelines/cycle_diffusion">cycle_diffusion</a></td> <td><a href="https://arxiv.org/abs/2210.05559" rel="nofollow">Unifying Diffusion Models’ Latent Space, with Applications to CycleDiffusion and Guidance</a></td> <td align="center">Image-to-Image Text-Guided Generation</td></tr> <tr><td><a href="./api/pipelines/dance_diffusion">dance_diffusion</a></td> <td><a href="https://github.com/williamberman/diffusers.git" rel="nofollow">Dance Diffusion</a></td> <td align="center">Unconditional Audio Generation</td></tr> <tr><td><a href="./api/pipelines/ddpm">ddpm</a></td> <td><a href="https://arxiv.org/abs/2006.11239" rel="nofollow">Denoising Diffusion Probabilistic Models</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./api/pipelines/ddim">ddim</a></td> <td><a href="https://arxiv.org/abs/2010.02502" rel="nofollow">Denoising Diffusion Implicit Models</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./if">if</a></td> <td><a href="./api/pipelines/if"><strong>IF</strong></a></td> <td align="center">Image Generation</td></tr> <tr><td><a href="./if">if_img2img</a></td> <td><a href="./api/pipelines/if"><strong>IF</strong></a></td> <td align="center">Image-to-Image Generation</td></tr> <tr><td><a href="./if">if_inpainting</a></td> <td><a href="./api/pipelines/if"><strong>IF</strong></a></td> <td align="center">Image-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/latent_diffusion">latent_diffusion</a></td> <td><a href="https://arxiv.org/abs/2112.10752" rel="nofollow">High-Resolution Image Synthesis with Latent Diffusion Models</a></td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/latent_diffusion">latent_diffusion</a></td> <td><a href="https://arxiv.org/abs/2112.10752" rel="nofollow">High-Resolution Image Synthesis with Latent Diffusion Models</a></td> <td align="center">Super Resolution Image-to-Image</td></tr> <tr><td><a href="./api/pipelines/latent_diffusion_uncond">latent_diffusion_uncond</a></td> <td><a href="https://arxiv.org/abs/2112.10752" rel="nofollow">High-Resolution Image Synthesis with Latent Diffusion Models</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./api/pipelines/paint_by_example">paint_by_example</a></td> <td><a href="https://arxiv.org/abs/2211.13227" rel="nofollow">Paint by Example: Exemplar-based Image Editing with Diffusion Models</a></td> <td align="center">Image-Guided Image Inpainting</td></tr> <tr><td><a href="./api/pipelines/pndm">pndm</a></td> <td><a href="https://arxiv.org/abs/2202.09778" rel="nofollow">Pseudo Numerical Methods for Diffusion Models on Manifolds</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./api/pipelines/score_sde_ve">score_sde_ve</a></td> <td><a href="https://openreview.net/forum?id=PxTIG12RRHS" rel="nofollow">Score-Based Generative Modeling through Stochastic Differential Equations</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./api/pipelines/score_sde_vp">score_sde_vp</a></td> <td><a href="https://openreview.net/forum?id=PxTIG12RRHS" rel="nofollow">Score-Based Generative Modeling through Stochastic Differential Equations</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./api/pipelines/semantic_stable_diffusion">semantic_stable_diffusion</a></td> <td><a href="https://arxiv.org/abs/2301.12247" rel="nofollow">Semantic Guidance</a></td> <td align="center">Text-Guided Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/text2img">stable_diffusion_text2img</a></td> <td><a href="https://stability.ai/blog/stable-diffusion-public-release" rel="nofollow">Stable Diffusion</a></td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/img2img">stable_diffusion_img2img</a></td> <td><a href="https://stability.ai/blog/stable-diffusion-public-release" rel="nofollow">Stable Diffusion</a></td> <td align="center">Image-to-Image Text-Guided Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/inpaint">stable_diffusion_inpaint</a></td> <td><a href="https://stability.ai/blog/stable-diffusion-public-release" rel="nofollow">Stable Diffusion</a></td> <td align="center">Text-Guided Image Inpainting</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/panorama">stable_diffusion_panorama</a></td> <td><a href="https://multidiffusion.github.io/" rel="nofollow">MultiDiffusion</a></td> <td align="center">Text-to-Panorama Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/pix2pix">stable_diffusion_pix2pix</a></td> <td><a href="https://arxiv.org/abs/2211.09800" rel="nofollow">InstructPix2Pix: Learning to Follow Image Editing Instructions</a></td> <td align="center">Text-Guided Image Editing</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/pix2pix_zero">stable_diffusion_pix2pix_zero</a></td> <td><a href="https://pix2pixzero.github.io/" rel="nofollow">Zero-shot Image-to-Image Translation</a></td> <td align="center">Text-Guided Image Editing</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/attend_and_excite">stable_diffusion_attend_and_excite</a></td> <td><a href="https://arxiv.org/abs/2301.13826" rel="nofollow">Attend-and-Excite: Attention-Based Semantic Guidance for Text-to-Image Diffusion Models</a></td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/self_attention_guidance">stable_diffusion_self_attention_guidance</a></td> <td><a href="https://arxiv.org/abs/2210.00939" rel="nofollow">Improving Sample Quality of Diffusion Models Using Self-Attention Guidance</a></td> <td align="center">Text-to-Image Generation Unconditional Image Generation</td></tr> <tr><td><a href="./stable_diffusion/image_variation">stable_diffusion_image_variation</a></td> <td><a href="https://github.com/LambdaLabsML/lambda-diffusers#stable-diffusion-image-variations" rel="nofollow">Stable Diffusion Image Variations</a></td> <td align="center">Image-to-Image Generation</td></tr> <tr><td><a href="./stable_diffusion/latent_upscale">stable_diffusion_latent_upscale</a></td> <td><a href="https://twitter.com/StabilityAI/status/1590531958815064065" rel="nofollow">Stable Diffusion Latent Upscaler</a></td> <td align="center">Text-Guided Super Resolution Image-to-Image</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion/model_editing">stable_diffusion_model_editing</a></td> <td><a href="https://time-diffusion.github.io/" rel="nofollow">Editing Implicit Assumptions in Text-to-Image Diffusion Models</a></td> <td align="center">Text-to-Image Model Editing</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion_2">stable_diffusion_2</a></td> <td><a href="https://stability.ai/blog/stable-diffusion-v2-release" rel="nofollow">Stable Diffusion 2</a></td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion_2">stable_diffusion_2</a></td> <td><a href="https://stability.ai/blog/stable-diffusion-v2-release" rel="nofollow">Stable Diffusion 2</a></td> <td align="center">Text-Guided Image Inpainting</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion_2">stable_diffusion_2</a></td> <td><a href="https://github.com/Stability-AI/stablediffusion#depth-conditional-stable-diffusion" rel="nofollow">Depth-Conditional Stable Diffusion</a></td> <td align="center">Depth-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion_2">stable_diffusion_2</a></td> <td><a href="https://stability.ai/blog/stable-diffusion-v2-release" rel="nofollow">Stable Diffusion 2</a></td> <td align="center">Text-Guided Super Resolution Image-to-Image</td></tr> <tr><td><a href="./api/pipelines/stable_diffusion_safe">stable_diffusion_safe</a></td> <td><a href="https://arxiv.org/abs/2211.05105" rel="nofollow">Safe Stable Diffusion</a></td> <td align="center">Text-Guided Generation</td></tr> <tr><td><a href="./stable_unclip">stable_unclip</a></td> <td>Stable unCLIP</td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./stable_unclip">stable_unclip</a></td> <td>Stable unCLIP</td> <td align="center">Image-to-Image Text-Guided Generation</td></tr> <tr><td><a href="./api/pipelines/stochastic_karras_ve">stochastic_karras_ve</a></td> <td><a href="https://arxiv.org/abs/2206.00364" rel="nofollow">Elucidating the Design Space of Diffusion-Based Generative Models</a></td> <td align="center">Unconditional Image Generation</td></tr> <tr><td><a href="./api/pipelines/text_to_video">text_to_video_sd</a></td> <td><a href="https://modelscope.cn/models/damo/text-to-video-synthesis/summary" rel="nofollow">Modelscope’s Text-to-video-synthesis Model in Open Domain</a></td> <td align="center">Text-to-Video Generation</td></tr> <tr><td><a href="./api/pipelines/unclip">unclip</a></td> <td><a href="https://arxiv.org/abs/2204.06125" rel="nofollow">Hierarchical Text-Conditional Image Generation with CLIP Latents</a>(implementation by <a href="https://github.com/kakaobrain/karlo" rel="nofollow">kakaobrain</a>)</td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/versatile_diffusion">versatile_diffusion</a></td> <td><a href="https://arxiv.org/abs/2211.08332" rel="nofollow">Versatile Diffusion: Text, Images and Variations All in One Diffusion Model</a></td> <td align="center">Text-to-Image Generation</td></tr> <tr><td><a href="./api/pipelines/versatile_diffusion">versatile_diffusion</a></td> <td><a href="https://arxiv.org/abs/2211.08332" rel="nofollow">Versatile Diffusion: Text, Images and Variations All in One Diffusion Model</a></td> <td align="center">Image Variations Generation</td></tr> <tr><td><a href="./api/pipelines/versatile_diffusion">versatile_diffusion</a></td> <td><a href="https://arxiv.org/abs/2211.08332" rel="nofollow">Versatile Diffusion: Text, Images and Variations All in One Diffusion Model</a></td> <td align="center">Dual Image and Text Guided Generation</td></tr> <tr><td><a href="./api/pipelines/vq_diffusion">vq_diffusion</a></td> <td><a href="https://arxiv.org/abs/2111.14822" rel="nofollow">Vector Quantized Diffusion Model for Text-to-Image Synthesis</a></td> <td align="center">Text-to-Image Generation</td></tr></tbody>',P,v,k;return p=new Y({props:{title:"🧨 Diffusers",local:"-diffusers",headingTag:"h1"}}),c=new Y({props:{title:"🧨 Diffusers pipelines",local:"-diffusers-pipelines",headingTag:"h2"}}),{c(){l=d("meta"),w=n(),x=d("p"),I=n(),s=d("p"),s.innerHTML=H,y=n(),B(p.$$.fragment),G=n(),u=d("p"),u.innerHTML=$,D=n(),g=d("p"),g.textContent=U,T=n(),h=d("ul"),h.innerHTML=R,M=n(),f=d("div"),f.innerHTML=V,S=n(),B(c.$$.fragment),L=n(),m=d("p"),m.textContent=q,C=n(),b=d("table"),b.innerHTML=z,P=n(),v=d("p"),this.h()},l(e){const t=te("svelte-u9bgzb",document.head);l=r(t,"META",{name:!0,content:!0}),t.forEach(i),w=o(e),x=r(e,"P",{}),F(x).forEach(i),I=o(e),s=r(e,"P",{align:!0,"data-svelte-h":!0}),_(s)!=="svelte-aksdn0"&&(s.innerHTML=H),y=o(e),O(p.$$.fragment,e),G=o(e),u=r(e,"P",{"data-svelte-h":!0}),_(u)!=="svelte-7h3gty"&&(u.innerHTML=$),D=o(e),g=r(e,"P",{"data-svelte-h":!0}),_(g)!=="svelte-f0h4hq"&&(g.textContent=U),T=o(e),h=r(e,"UL",{"data-svelte-h":!0}),_(h)!=="svelte-qatawh"&&(h.innerHTML=R),M=o(e),f=r(e,"DIV",{class:!0,"data-svelte-h":!0}),_(f)!=="svelte-1kh56sb"&&(f.innerHTML=V),S=o(e),O(c.$$.fragment,e),L=o(e),m=r(e,"P",{"data-svelte-h":!0}),_(m)!=="svelte-q0dceg"&&(m.textContent=q),C=o(e),b=r(e,"TABLE",{"data-svelte-h":!0}),_(b)!=="svelte-roh3l2"&&(b.innerHTML=z),P=o(e),v=r(e,"P",{}),F(v).forEach(i),this.h()},h(){A(l,"name","hf:doc:metadata"),A(l,"content",ne),A(s,"align","center"),A(f,"class","mt-10")},m(e,t){ie(document.head,l),a(e,w,t),a(e,x,t),a(e,I,t),a(e,s,t),a(e,y,t),j(p,e,t),a(e,G,t),a(e,u,t),a(e,D,t),a(e,g,t),a(e,T,t),a(e,h,t),a(e,M,t),a(e,f,t),a(e,S,t),j(c,e,t),a(e,L,t),a(e,m,t),a(e,C,t),a(e,b,t),a(e,P,t),a(e,v,t),k=!0},p:J,i(e){k||(Q(p.$$.fragment,e),Q(c.$$.fragment,e),k=!0)},o(e){N(p.$$.fragment,e),N(c.$$.fragment,e),k=!1},d(e){e&&(i(w),i(x),i(I),i(s),i(y),i(G),i(u),i(D),i(g),i(T),i(h),i(M),i(f),i(S),i(L),i(m),i(C),i(b),i(P),i(v)),i(l),W(p,e),W(c,e)}}}const ne='{"title":"🧨 Diffusers","local":"-diffusers","sections":[{"title":"🧨 Diffusers pipelines","local":"-diffusers-pipelines","sections":[],"depth":2}],"depth":1}';function oe(E){return K(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class se extends X{constructor(l){super(),ee(this,l,oe,ae,Z,{})}}export{se as component};

Xet Storage Details

Size:
17.3 kB
·
Xet hash:
c1e443a66d062ba63ef61a0e9b5eb07f7ac2e2d7f2b6d5493f5d712919171ddc

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.