Buckets:
| import{s as ci,n as di,o as mi}from"../chunks/scheduler.f3b1e791.js";import{S as ui,i as hi,e as a,s as i,c as p,h as fi,a as o,d as l,b as s,f as pi,g as c,j as r,k as nn,l as Ti,m as n,n as d,t as m,o as u,p as h}from"../chunks/index.023a9934.js";import{C as yi}from"../chunks/CopyLLMTxtMenu.c780467c.js";import{C as T}from"../chunks/CodeBlock.fc650646.js";import{H as f,E as bi}from"../chunks/MermaidChart.svelte_svelte_type_style_lang.fb377ec3.js";function Mi(sn){let y,ct,rt,dt,M,mt,k,ut,g,ht,w,an=`The Kernel Hub allows Python libraries and applications to load compute | |
| kernels directly from the <a href="https://hf.co/" rel="nofollow">Hub</a>. To support this kind | |
| of dynamic loading, Hub kernels differ from traditional Python kernel | |
| packages in that they are made to be:`,ft,$,on=`<li>Portable: a kernel can be loaded from paths outside <code>PYTHONPATH</code>.</li> <li>Unique: multiple versions of the same kernel can be loaded in the | |
| same Python process.</li> <li>Compatible: kernels must support all recent versions of Python and | |
| the different PyTorch build configurations (various CUDA versions | |
| and C++ ABIs). Furthermore, older C library versions must be supported.</li>`,Tt,U,rn=`<code>kernel-builder</code> is a set of tools that can build conforming kernels. It | |
| takes care of:`,yt,J,pn=`<li>Building kernels for all supported PyTorch configurations (C++98/11 and | |
| different CUDA versions).</li> <li>Compatibility with old glibc and libstdc++ versions, so that kernels also | |
| work on older Linux distributions.</li> <li>Registering Torch ops, such that multiple versions the same kernel can be | |
| loaded without namespace conflicts.</li>`,bt,C,cn=`<code>kernel-builder</code> builds are configured through a <code>build.toml</code> file. | |
| <code>build.toml</code> is a simple format that does not require intricate knowledge | |
| of CMake or setuptools.`,Mt,j,dn=`This page describes the directory layout of a kernel-builder project, the | |
| format of the <code>build.toml</code> file, and some additional Python glue that | |
| <code>kernel-builder</code> provides. We will use a <a href="https://github.com/huggingface/kernels/tree/main/examples/kernels/relu" rel="nofollow">simple ReLU kernel</a> | |
| as the running example. After reading this page, you may also want to have | |
| a look at the more realistic <a href="https://github.com/huggingface/kernels/tree/main/examples/kernels/relu-backprop-compile" rel="nofollow">ReLU kernel with backprop and <code>torch.compile</code></a> | |
| support.`,kt,b,mn=`<p>We maintain a set of conforming kernels in the | |
| <a href="https://github.com/huggingface/kernels-community" rel="nofollow">kernels-community repository</a>. | |
| We try to keep these kernels synced with upstream as much as possible.</p>`,gt,v,wt,x,$t,I,un=`The fastest way to get started is to run the install script. This | |
| installs <a href="https://docs.determinate.systems/determinate-nix/" rel="nofollow">Determinate Nix</a> | |
| and <code>kernel-builder</code> in a single command:`,Ut,_,Jt,H,hn="This will:",Ct,L,fn=`<li>Install Determinate Nix (if not already installed).</li> <li>Configure the Hugging Face binary cache (to avoid building dependencies from | |
| source).</li> <li>Install <code>kernel-builder</code> via <code>nix profile install</code>.</li>`,jt,Z,Tn="To update <code>kernel-builder</code> later:",vt,V,xt,B,yn=`For a step-by-step breakdown of what the script does, see | |
| <a href="nix">Using the kernel builder with Nix</a>.`,It,N,_t,R,bn=`In the <a href="https://github.com/huggingface/kernels/tree/main/terraform" rel="nofollow"><code>terraform</code></a> directory, we provide an | |
| example of programatically spinning up an EC2 instance that is ready | |
| with everything needed for you to start developing and building | |
| kernels.`,Ht,W,Mn=`If you use a different provider, the Terraform bridges should be | |
| similar and straightforward to modify.`,Lt,Q,Zt,E,kn=`The easiest way to start a new kernel is by using the <code>init</code> subcommand | |
| of <code>kernel-builder</code>. This creates a minimal, compilable kernel:`,Vt,A,Bt,X,gn=`This creates a kernel named <code>mykernel</code> in the directory <code>mykernel</code>. The | |
| kernel is configured to upload to the <code>myorg/mykernel</code> Hub | |
| repository when an upload command is used.`,Nt,S,wn=`By default, the <code>init</code> subcommand creates a CUDA kernel. You can specify | |
| another backend with the <code>--backends</code> option:`,Rt,G,Wt,q,$n=`You can also make a multi-backend kernel by adding all the backends | |
| that you would like to support as arguments to <code>--backends</code>:`,Qt,P,Et,Y,Un=`Finally, if you want to create a kernel for all supported backends, you | |
| can use <code>--backends all</code>.`,At,F,Xt,O,Jn="Kernel projects follow this general directory layout:",St,z,Gt,D,Cn="In this example we can find:",qt,K,jn=`<li>The build configuration in <code>build.toml</code>.</li> <li>One or more top-level directories containing kernels (<code>mykernel_cuda</code>).</li> <li>The <code>torch-ext</code> directory, which contains: | |
| <ul><li><code>torch_binding.h</code>: contains declarations for kernel entry points | |
| (from <code>kernel_a</code> and <code>kernel_b</code>).</li> <li><code>torch_binding.cpp</code>: registers the entry points as Torch ops.</li> <li><code>torch_ext/mykernel</code>: contains any Python wrapping the kernel needs. At the | |
| bare minimum, it should contain an <code>__init__.py</code> file.</li></ul></li> <li>Kernel tests in the directory <code>tests</code>.</li> <li>Benchmarks in the directory <code>benchmarks</code>.</li> <li>A kernel card template in <code>CARD.md</code>. This placeholders in the card are filled | |
| during the kernel build.</li> <li>The Nix flake configuration in <code>flake.nix</code>.</li> <li>An example script that uses the kernel in <code>example.py</code>.</li>`,Pt,ee,Yt,te,vn=`<code>build.toml</code> tells <code>kernel-builder</code> what to build and how. It looks as | |
| follows for the <code>mykernel</code> kernel:`,Ft,le,Ot,ne,xn="The following sections enumerate all supported options for <code>build.toml</code>.",zt,ie,Dt,se,In=`<li><code>name</code> (required): the name of the kernel. The Python code for a Torch | |
| extension must be stored in <code>torch-ext/<name></code>.</li> <li><code>version</code> (int): the major version of the kernel. | |
| The version is written to the kernel’s <code>metadata.json</code> and is used | |
| by the <code>kernels upload</code> command to upload the kernel to a version | |
| branch named <code>v<version></code>.</li> <li><code>backends</code> (required): a list of supported backends. Must be one or | |
| more of <code>cpu</code>, <code>cuda</code>, <code>metal</code>, <code>rocm</code>, or <code>xpu</code>.</li> <li><code>python-depends</code> (<strong>experimental</strong>): a list of additional Python dependencies | |
| that the kernel requires. The only supported dependencies are <code>einops</code> | |
| and <code>nvidia-cutlass-dsl</code>.</li>`,Kt,ae,el,oe,_n=`<li><code>repo-id</code>: the Hub repository to upload the kernel to when the <code>upload</code> or | |
| <code>build-and-upload</code> subcommands of <code>kernel-builder</code> are used.</li>`,tl,re,ll,pe,Hn=`<li><code>maxver</code>: the maximum CUDA toolkit version (inclusive). This option | |
| <em>must not</em> be set under normal circumstances, since it can exclude Torch | |
| build variants that are <a href="../kernel-requirements">required for compliant kernels</a>. | |
| This option is provided for kernels that cause compiler errors on | |
| newer CUDA toolkit versions.</li> <li><code>minver</code>: the minimum required CUDA toolkit version. This option | |
| <em>must not</em> be set under normal circumstances, since it can exclude Torch | |
| build variants that are <a href="../kernel-requirements">required for compliant kernels</a>. | |
| This option is provided for kernels that require functionality only | |
| provided by newer CUDA toolkits.</li>`,nl,ce,il,de,Ln=`This section describes the Torch extension. In the future, there may be | |
| similar sections for other frameworks. This section has the following | |
| options:`,sl,me,Zn=`<li><code>src</code> (required): a list of source files and headers.</li> <li><code>pyext</code> (optional): the list of extensions for Python files. Default: | |
| <code>["py", "pyi"]</code>.</li> <li><code>include</code> (optional): include directories relative to the project root. | |
| Default: <code>[]</code>.</li> <li><code>maxver</code> (optional): only build for this Torch version and earlier. Use cautiously, since this option produces | |
| non-compliant kernels if the version range does not correspond to the <a href="build-variants">required variants</a>.</li> <li><code>minver</code> (optional): only build for this Torch version and later. Use cautiously, since this option produces | |
| non-compliant kernels if the version range does not correspond to the <a href="build-variants">required variants</a>.</li> <li><code>stable-abi</code> (<strong>experimental</strong>): when set to a Torch version (e.g. | |
| <code>"2.11"</code>), the kernel is built using the Torch stable ABI. This | |
| requires that the kernel itself only use | |
| <a href="https://docs.pytorch.org/docs/2.12/notes/libtorch_stable_abi.html" rel="nofollow">stable ABI headers</a>. | |
| For an example, see the <a href="https://github.com/huggingface/kernels/tree/main/examples/kernels/relu-torch-stable-abi" rel="nofollow"><code>relu-torch-stable-abi</code></a> | |
| example kernel.</li>`,al,ue,ol,he,Vn=`Specification of a kernel with the name <code><name></code>. Multiple <code>kernel.<name></code> | |
| sections can be defined in the same <code>build.toml</code>. | |
| See for example <a href="https://huggingface.co/kernels-community/quantization/" rel="nofollow"><code>kernels-community/quantization</code></a> | |
| for an example with multiple kernel sections.`,rl,fe,Bn="The following options can be set for a kernel:",pl,Te,Nn=`<li><code>backend</code> (required): the compute backend of the kernel. The currently | |
| supported backends are <code>cpu</code>, <code>cuda</code>, <code>metal</code>, <code>rocm</code>, and <code>xpu</code>. | |
| <strong>The <code>cpu</code> backend is currently experimental and might still change.</strong></li> <li><code>depends</code> (required): a list of dependencies. The supported dependencies | |
| are listed in <a href="https://github.com/huggingface/kernels/blob/main/builder/lib/deps.nix" rel="nofollow"><code>deps.nix</code></a>.</li> <li><code>src</code> (required): a list of source files and headers.</li> <li><code>include</code> (optional): include directories relative to the project root. | |
| Default: <code>[]</code>.</li>`,cl,ye,Rn=`Besides these shared options, the following backend-specific options | |
| are available:`,dl,be,ml,Me,Wn=`<li><code>cuda-capabilities</code> (optional): a list of CUDA capabilities that the | |
| kernel should be compiled for. When absent, the kernel will be built | |
| using all capabilities that the builder supports. The effective | |
| capabilities are the intersection of this list and the capabilities | |
| supported by the CUDA compiler. It is recommended to leave this option | |
| unspecified <strong>unless</strong> a kernel requires specific capabilities.</li> <li><code>cuda-flags</code> (optional): additional flags to be passed to <code>nvcc</code>. | |
| <strong>Warning</strong>: this option should only be used in exceptional circumstances. | |
| Custom compile flags can interfere with the build process or break | |
| compatibility requirements.</li>`,ul,ke,hl,ge,Qn=`<li><code>rocm-archs</code>: a list of ROCm architectures that the kernel should be | |
| compiled for.</li>`,fl,we,Tl,$e,En=`<li><code>sycl-flags</code>: a list of additional flags to be passed to the SYCL | |
| compiler.</li>`,yl,Ue,bl,Je,An=`<li><code>cxx-flags</code>: a list of additional flags to be passed to the C++ | |
| compiler.</li>`,Ml,Ce,kl,je,gl,ve,Xn="Torch bindings are defined in C++, kernels commonly use two files:",wl,xe,Sn="<li><code>torch_binding.h</code> containing function declarations.</li> <li><code>torch_binding.cpp</code> registering the functions as Torch ops.</li>",$l,Ie,Gn=`For instance, the <code>mykernel</code> kernel discussed above has the following | |
| declaration in <code>torch_binding.h</code>:`,Ul,_e,Jl,He,qn="This function is then registered as a Torch op in <code>torch_binding.cpp</code>:",Cl,Le,jl,Ze,Pn=`This snippet uses macros from <code>registration.h</code> to register the function. | |
| <code>registration.h</code> is generated by <code>kernel-builder</code> itself. A function | |
| is registered through the <code>def</code>/<code>ops</code> methods. <code>ops</code> specifies the | |
| function signature following the <a href="https://github.com/pytorch/pytorch/blob/main/aten/src/ATen/native/README.md#func" rel="nofollow">function schema</a>. | |
| <code>impl</code> associates the function name with the C/C++ function and | |
| the applicable device.`,vl,Ve,xl,Be,Yn=`The bindings are typically wrapped in Python code in <code>torch_ext/<name></code>. | |
| The native code is exposed under the <code>torch.ops</code> namespace. However, | |
| we add some unique material to the name of the extension to ensure that | |
| different versions of the same extension can be loaded at the same time. | |
| As a result, the extension is registered as | |
| <code>torch.ops.<name>_<unique_material></code>.`,Il,Ne,Fn=`To deal with this uniqueness, <code>kernel_builder</code> generates a Python module | |
| named <code>_ops</code> that contains an alias for the name. This can be used to | |
| refer to the correct <code>torch.ops</code> module. For example:`,_l,Re,Hl,We,Ll,Qe,On=`You may want to register Torch ops from your kernel’s Python code or | |
| register fake ops for <code>torch.compile</code> support. It is important to register | |
| such ops in the namespace that kernel-builder makes for your kernel | |
| build. This is required for compliant kernels to ensure that multiple | |
| versions of the same kernel can be loaded at the same time without | |
| namespace conflicts.`,Zl,Ee,zn=`You can use the <code>add_op_namespace_prefix</code> to prefix an op name with the | |
| correct prefix. So for instance, replace`,Vl,Ae,Bl,Xe,Dn="by",Nl,Se,Rl,Ge,Kn="As mentioned in the above, the <code>_ops</code> module is generated by kernel-builder.",Wl,qe,ei=`kernel-builder uses a hook to reject incorrect usage of Torch op registration | |
| functions. However, it can only catch direct use of certain <code>torch.library</code> | |
| decorators. For instance, the hook would not reject the following decorator, | |
| so it should be seen as a last-resort check if human review failed:`,Ql,Pe,El,Ye,Al,Fe,ti=`Kernel tests are stored in the <code>tests</code> directory. Since running all | |
| kernel tests in CI may be prohibitively expensive, the <code>pyproject.toml</code> | |
| generated by the builder adds support for the special <code>kernels_ci</code> | |
| PyTest marker that can be used as follows:`,Xl,Oe,Sl,ze,li=`We recommend that you to pick tests that together would catch most error | |
| cases while running within 60 seconds.`,Gl,De,ni="You can run the tests (e.g. in CI) using:",ql,Ke,Pl,et,ii=`If the kernel supports multiple backends, it will run the test for the | |
| first supported backend that was found, obeying the following order: CUDA, | |
| ROCm, XPU, Metal, CPU. If you would like to the tests for a specific build | |
| variant, you can use <code>nix run .#ciTests.<variant></code>. For instance:`,Yl,tt,Fl,lt,si=`When running the tests on a non-NixOS systems, make sure that | |
| <a href="https://danieldk.eu/Software/Nix/Nix-CUDA-on-non-NixOS-systems#solutions" rel="nofollow">the CUDA driver library can be found</a>.`,Ol,nt,zl,it,ai=`We provide a utility to generate a system card for a given kernel, utilizing | |
| information from its <code>build.toml</code> and metadata. This system card provides a | |
| reasonable starting point and is meant to be edited afterward by the kernel | |
| developer.`,Dl,st,oi=`The template card is generated as a part of <code>kernel-builder init</code> | |
| command and is serialized in the root directory of the kernel.`,Kl,at,ri=`The card will be filled automatically by the builder when using the | |
| <code>build-and-upload</code> or <code>build-and-copy</code> command. It will be serialized | |
| to the <code>build</code> sub-directory inside the main kernel directory. It | |
| will be uploaded as <code>README.md</code> to the Hub.`,en,ot,tn,pt,ln;return M=new yi({props:{containerStyle:"float: right; margin-left: 10px; display: inline-flex; position: relative; z-index: 10;"}}),k=new f({props:{title:"Writing Hub kernels with kernel-builder",local:"writing-hub-kernels-with-kernel-builder",headingTag:"h1"}}),g=new f({props:{title:"Introduction",local:"introduction",headingTag:"h2"}}),v=new f({props:{title:"Setting up environment",local:"setting-up-environment",headingTag:"h2"}}),x=new f({props:{title:"Quick install",local:"quick-install",headingTag:"h3"}}),_=new T({props:{code:"Y3VybCUyMC1mc1NMJTIwaHR0cHMlM0ElMkYlMkZyYXcuZ2l0aHVidXNlcmNvbnRlbnQuY29tJTJGaHVnZ2luZ2ZhY2UlMkZrZXJuZWxzJTJGbWFpbiUyRmluc3RhbGwuc2glMjAlN0MlMjBiYXNo",highlighted:"curl -fsSL https://raw.githubusercontent.com/huggingface/kernels/main/install.sh | bash",lang:"bash",wrap:!1}}),V=new T({props:{code:"bml4JTIwcHJvZmlsZSUyMHVwZ3JhZGUlMjAtLWFsbA==",highlighted:"nix profile upgrade --all",lang:"bash",wrap:!1}}),N=new f({props:{title:"Cloud environment",local:"cloud-environment",headingTag:"h3"}}),Q=new f({props:{title:"Starting a new kernel",local:"starting-a-new-kernel",headingTag:"h2"}}),A=new T({props:{code:"JTI0JTIwa2VybmVsLWJ1aWxkZXIlMjBpbml0JTIwLS1uYW1lJTIwbXlvcmclMkZteWtlcm5lbCUwQUluaXRpYWxpemVkJTIwJTYwbXlvcmclMkZteWtlcm5lbCU2MCUyMGF0JTIwJTJGaG9tZSUyRmRhbmllbCUyRmdpdCUyRmtlcm5lbHMlMkZleGFtcGxlcyUyRmtlcm5lbHMlMkZteWtlcm5lbA==",highlighted:"$ kernel-builder init --name myorg/mykernel\nInitialized `myorg/mykernel` at /home/daniel/git/kernels/examples/kernels/mykernel",lang:"bash",wrap:!1}}),G=new T({props:{code:"JTI0JTIwa2VybmVsLWJ1aWxkZXIlMjBpbml0JTIwLS1uYW1lJTIwbXlvcmclMkZteWtlcm5lbCUyMC0tYmFja2VuZHMlMjB4cHU=",highlighted:"$ kernel-builder init --name myorg/mykernel --backends xpu",lang:"bash",wrap:!1}}),P=new T({props:{code:"JTI0JTIwa2VybmVsLWJ1aWxkZXIlMjBpbml0JTIwLS1uYW1lJTIwbXlvcmclMkZteWtlcm5lbCUyMC0tYmFja2VuZHMlMjBjdWRhJTIweHB1JTBBSW5pdGlhbGl6ZWQlMjAlNjBteW9yZyUyRm15a2VybmVsJTYwJTIwYXQlMjAlMkZob21lJTJGZGFuaWVsJTJGZ2l0JTJGa2VybmVscyUyRmV4YW1wbGVzJTJGa2VybmVscyUyRm15a2VybmVs",highlighted:"$ kernel-builder init --name myorg/mykernel --backends cuda xpu\nInitialized `myorg/mykernel` at /home/daniel/git/kernels/examples/kernels/mykernel",lang:"bash",wrap:!1}}),F=new f({props:{title:"Kernel project layout",local:"kernel-project-layout",headingTag:"h2"}}),z=new T({props:{code:"bXlrZXJuZWwlMEElRTIlOTQlOUMlRTIlOTQlODAlRTIlOTQlODAlMjBiZW5jaG1hcmtzJTBBJUUyJTk0JTgyJTIwJTIwJTIwJUUyJTk0JTk0JUUyJTk0JTgwJUUyJTk0JTgwJTIwYmVuY2htYXJrLnB5JTBBJUUyJTk0JTlDJUUyJTk0JTgwJUUyJTk0JTgwJTIwYnVpbGQudG9tbCUwQSVFMiU5NCU5QyVFMiU5NCU4MCVFMiU5NCU4MCUyMENBUkQubWQlMEElRTIlOTQlOUMlRTIlOTQlODAlRTIlOTQlODAlMjBleGFtcGxlLnB5JTBBJUUyJTk0JTlDJUUyJTk0JTgwJUUyJTk0JTgwJTIwZmxha2Uubml4JTBBJUUyJTk0JTlDJUUyJTk0JTgwJUUyJTk0JTgwJTIwbXlrZXJuZWxfY3VkYSUwQSVFMiU5NCU4MiUyMCUyMCUyMCVFMiU5NCU5NCVFMiU5NCU4MCVFMiU5NCU4MCUyMG15a2VybmVsLmN1JTBBJUUyJTk0JTlDJUUyJTk0JTgwJUUyJTk0JTgwJTIwdGVzdHMlMEElRTIlOTQlODIlMjAlMjAlMjAlRTIlOTQlOUMlRTIlOTQlODAlRTIlOTQlODAlMjBfX2luaXRfXy5weSUwQSVFMiU5NCU4MiUyMCUyMCUyMCVFMiU5NCU5NCVFMiU5NCU4MCVFMiU5NCU4MCUyMHRlc3RfbXlrZXJuZWwucHklMEElRTIlOTQlOTQlRTIlOTQlODAlRTIlOTQlODAlMjB0b3JjaC1leHQlMEElRTIlOTQlOUMlRTIlOTQlODAlRTIlOTQlODAlMjBteWtlcm5lbCUwQSVFMiU5NCU4MiUyMCUyMCUyMCVFMiU5NCU5NCVFMiU5NCU4MCVFMiU5NCU4MCUyMF9faW5pdF9fLnB5JTBBJUUyJTk0JTlDJUUyJTk0JTgwJUUyJTk0JTgwJTIwdG9yY2hfYmluZGluZy5jcHAlMEElRTIlOTQlOTQlRTIlOTQlODAlRTIlOTQlODAlMjB0b3JjaF9iaW5kaW5nLmg=",highlighted:`mykernel | |
| ├── benchmarks | |
| │ └── benchmark.py | |
| ├── build.toml | |
| ├── CARD.md | |
| ├── example.py | |
| ├── flake.nix | |
| ├── mykernel_cuda | |
| │ └── mykernel.cu | |
| ├── tests | |
| │ ├── __init__.py | |
| │ └── test_mykernel.py | |
| └── torch-ext | |
| ├── mykernel | |
| │ └── __init__.py | |
| ├── torch_binding.cpp | |
| └── torch_binding.h`,lang:"text",wrap:!1}}),ee=new f({props:{title:"build.toml",local:"buildtoml",headingTag:"h2"}}),le=new T({props:{code:"JTVCZ2VuZXJhbCU1RCUwQWJhY2tlbmRzJTIwJTNEJTIwJTVCJTBBJTIwJTIwJTIyY3VkYSUyMiUyQyUwQSU1RCUwQW5hbWUlMjAlM0QlMjAlMjJteWtlcm5lbCUyMiUwQXZlcnNpb24lMjAlM0QlMjAxJTBBJTBBJTVCZ2VuZXJhbC5odWIlNUQlMEFyZXBvLWlkJTIwJTNEJTIwJTIybXlvcmclMkZteWtlcm5lbCUyMiUwQSUwQSU1QnRvcmNoJTVEJTBBc3JjJTIwJTNEJTIwJTVCJTBBJTIwJTIwJTIydG9yY2gtZXh0JTJGdG9yY2hfYmluZGluZy5jcHAlMjIlMkMlMEElMjAlMjAlMjJ0b3JjaC1leHQlMkZ0b3JjaF9iaW5kaW5nLmglMjIlMkMlMEElNUQlMEElMEElNUJrZXJuZWwubXlrZXJuZWwlNUQlMEFiYWNrZW5kJTIwJTNEJTIwJTIyY3VkYSUyMiUwQWRlcGVuZHMlMjAlM0QlMjAlNUIlMjJ0b3JjaCUyMiU1RCUwQXNyYyUyMCUzRCUyMCU1QiUyMm15a2VybmVsX2N1ZGElMkZteWtlcm5lbC5jdSUyMiU1RCUwQSUyMyUyMElmJTIwdGhlJTIwa2VybmVsJTIwaXMlMjBvbmx5JTIwc3VwcG9ydGVkJTIwb24lMjBzcGVjaWZpYyUyMGNhcGFiaWxpdGllcyUyQyUyMHNldCUyMHRoZSUwQSUyMyUyMGN1ZGEtY2FwYWJpbGl0aWVzJTIwb3B0aW9uJTNBJTBBJTIzJTBBJTIzJTIwY3VkYS1jYXBhYmlsaXRpZXMlMjAlM0QlMjAlNUIlMjAlMjI5LjAlMjIlMkMlMjAlMjIxMC4wJTIyJTJDJTIwJTIyMTIuMCUyMiUyMCU1RA==",highlighted:`<span class="hljs-section">[general]</span> | |
| <span class="hljs-attr">backends</span> = [ | |
| <span class="hljs-string">"cuda"</span>, | |
| ] | |
| <span class="hljs-attr">name</span> = <span class="hljs-string">"mykernel"</span> | |
| <span class="hljs-attr">version</span> = <span class="hljs-number">1</span> | |
| <span class="hljs-section">[general.hub]</span> | |
| <span class="hljs-attr">repo-id</span> = <span class="hljs-string">"myorg/mykernel"</span> | |
| <span class="hljs-section">[torch]</span> | |
| <span class="hljs-attr">src</span> = [ | |
| <span class="hljs-string">"torch-ext/torch_binding.cpp"</span>, | |
| <span class="hljs-string">"torch-ext/torch_binding.h"</span>, | |
| ] | |
| <span class="hljs-section">[kernel.mykernel]</span> | |
| <span class="hljs-attr">backend</span> = <span class="hljs-string">"cuda"</span> | |
| <span class="hljs-attr">depends</span> = [<span class="hljs-string">"torch"</span>] | |
| <span class="hljs-attr">src</span> = [<span class="hljs-string">"mykernel_cuda/mykernel.cu"</span>] | |
| <span class="hljs-comment"># If the kernel is only supported on specific capabilities, set the</span> | |
| <span class="hljs-comment"># cuda-capabilities option:</span> | |
| <span class="hljs-comment">#</span> | |
| <span class="hljs-comment"># cuda-capabilities = [ "9.0", "10.0", "12.0" ]</span>`,lang:"toml",wrap:!1}}),ie=new f({props:{title:"general",local:"general",headingTag:"h3"}}),ae=new f({props:{title:"general.hub",local:"generalhub",headingTag:"h3"}}),re=new f({props:{title:"general.cuda",local:"generalcuda",headingTag:"h3"}}),ce=new f({props:{title:"torch",local:"torch",headingTag:"h3"}}),ue=new f({props:{title:"kernel.<name>",local:"kernelltnamegt",headingTag:"h3"}}),be=new f({props:{title:"cuda",local:"cuda",headingTag:"h4"}}),ke=new f({props:{title:"rocm",local:"rocm",headingTag:"h4"}}),we=new f({props:{title:"xpu",local:"xpu",headingTag:"h4"}}),Ue=new f({props:{title:"cpu",local:"cpu",headingTag:"h3"}}),Ce=new f({props:{title:"Torch bindings",local:"torch-bindings",headingTag:"h2"}}),je=new f({props:{title:"Defining bindings",local:"defining-bindings",headingTag:"h3"}}),_e=new T({props:{code:"JTIzcHJhZ21hJTIwb25jZSUwQSUwQSUyM2luY2x1ZGUlMjAlM0N0b3JjaCUyRnRvcmNoLmglM0UlMEElMEF2b2lkJTIwbXlrZXJuZWwodG9yY2glM0ElM0FUZW5zb3IlMjAlMjZvdXQlMkMlMjB0b3JjaCUzQSUzQVRlbnNvciUyMGNvbnN0JTIwJTI2aW5wdXQpJTNC",highlighted:`<span class="hljs-meta">#<span class="hljs-keyword">pragma</span> once</span> | |
| <span class="hljs-meta">#<span class="hljs-keyword">include</span> <span class="hljs-string"><torch/torch.h></span></span> | |
| <span class="hljs-function"><span class="hljs-type">void</span> <span class="hljs-title">mykernel</span><span class="hljs-params">(torch::Tensor &out, torch::Tensor <span class="hljs-type">const</span> &input)</span></span>;`,lang:"cpp",wrap:!1}}),Le=new T({props:{code:"JTIzaW5jbHVkZSUyMCUzQ3RvcmNoJTJGbGlicmFyeS5oJTNFJTBBJTBBJTIzaW5jbHVkZSUyMCUyMnJlZ2lzdHJhdGlvbi5oJTIyJTBBJTIzaW5jbHVkZSUyMCUyMnRvcmNoX2JpbmRpbmcuaCUyMiUwQSUwQVRPUkNIX0xJQlJBUllfRVhQQU5EKFRPUkNIX0VYVEVOU0lPTl9OQU1FJTJDJTIwb3BzKSUyMCU3QiUwQSUyMCUyMG9wcy5kZWYoJTIybXlrZXJuZWwoVGVuc29yISUyMG91dCUyQyUyMFRlbnNvciUyMGlucHV0KSUyMC0lM0UlMjAoKSUyMiklM0IlMEElMjNpZiUyMGRlZmluZWQoQ1VEQV9LRVJORUwpJTIwJTdDJTdDJTIwZGVmaW5lZChST0NNX0tFUk5FTCklMEElMjAlMjBvcHMuaW1wbCglMjJteWtlcm5lbCUyMiUyQyUyMHRvcmNoJTNBJTNBa0NVREElMkMlMjAlMjZteWtlcm5lbCklM0IlMEElMjNlbmRpZiUwQSU3RCUwQSUwQVJFR0lTVEVSX0VYVEVOU0lPTihUT1JDSF9FWFRFTlNJT05fTkFNRSk=",highlighted:`<span class="hljs-meta">#<span class="hljs-keyword">include</span> <span class="hljs-string"><torch/library.h></span></span> | |
| <span class="hljs-meta">#<span class="hljs-keyword">include</span> <span class="hljs-string">"registration.h"</span></span> | |
| <span class="hljs-meta">#<span class="hljs-keyword">include</span> <span class="hljs-string">"torch_binding.h"</span></span> | |
| <span class="hljs-built_in">TORCH_LIBRARY_EXPAND</span>(TORCH_EXTENSION_NAME, ops) { | |
| ops.<span class="hljs-built_in">def</span>(<span class="hljs-string">"mykernel(Tensor! out, Tensor input) -> ()"</span>); | |
| <span class="hljs-meta">#<span class="hljs-keyword">if</span> defined(CUDA_KERNEL) || defined(ROCM_KERNEL)</span> | |
| ops.<span class="hljs-built_in">impl</span>(<span class="hljs-string">"mykernel"</span>, torch::kCUDA, &mykernel); | |
| <span class="hljs-meta">#<span class="hljs-keyword">endif</span></span> | |
| } | |
| <span class="hljs-built_in">REGISTER_EXTENSION</span>(TORCH_EXTENSION_NAME)`,lang:"cpp",wrap:!1}}),Ve=new f({props:{title:"Using kernel functions from Python",local:"using-kernel-functions-from-python",headingTag:"h2"}}),Re=new T({props:{code:"ZnJvbSUyMHR5cGluZyUyMGltcG9ydCUyME9wdGlvbmFsJTBBJTBBaW1wb3J0JTIwdG9yY2glMEElMEFmcm9tJTIwLl9vcHMlMjBpbXBvcnQlMjBvcHMlMEElMEElMEFkZWYlMjBteWtlcm5lbCh4JTNBJTIwdG9yY2guVGVuc29yJTJDJTIwb3V0JTNBJTIwT3B0aW9uYWwlNUJ0b3JjaC5UZW5zb3IlNUQlMjAlM0QlMjBOb25lKSUyMC0lM0UlMjB0b3JjaC5UZW5zb3IlM0ElMEElMjAlMjAlMjAlMjBpZiUyMG91dCUyMGlzJTIwTm9uZSUzQSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMG91dCUyMCUzRCUyMHRvcmNoLmVtcHR5X2xpa2UoeCklMEElMjAlMjAlMjAlMjBvcHMubXlrZXJuZWwob3V0JTJDJTIweCklMEElMjAlMjAlMjAlMjByZXR1cm4lMjBvdXQ=",highlighted:`<span class="hljs-keyword">from</span> typing <span class="hljs-keyword">import</span> <span class="hljs-type">Optional</span> | |
| <span class="hljs-keyword">import</span> torch | |
| <span class="hljs-keyword">from</span> ._ops <span class="hljs-keyword">import</span> ops | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">mykernel</span>(<span class="hljs-params">x: torch.Tensor, out: <span class="hljs-type">Optional</span>[torch.Tensor] = <span class="hljs-literal">None</span></span>) -> torch.Tensor: | |
| <span class="hljs-keyword">if</span> out <span class="hljs-keyword">is</span> <span class="hljs-literal">None</span>: | |
| out = torch.empty_like(x) | |
| ops.mykernel(out, x) | |
| <span class="hljs-keyword">return</span> out`,lang:"python",wrap:!1}}),We=new f({props:{title:"Registering Torch operators",local:"registering-torch-operators",headingTag:"h2"}}),Ae=new T({props:{code:"JTQwdG9yY2gubGlicmFyeS5yZWdpc3Rlcl9mYWtlKCUyMnJlbHUlM0ElM0FyZWx1X2Z3ZCUyMiklMEFkZWYlMjByZWx1X2Z3ZF9mYWtlKGlucHV0JTNBJTIwdG9yY2guVGVuc29yKSUyMC0lM0UlMjB0b3JjaC5UZW5zb3IlM0ElMEElMjAlMjAlMjAlMjByZXR1cm4lMjB0b3JjaC5lbXB0eV9saWtlKGlucHV0KQ==",highlighted:`<span class="hljs-meta">@torch.library.register_fake(<span class="hljs-params"><span class="hljs-string">"relu::relu_fwd"</span></span>)</span> | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">relu_fwd_fake</span>(<span class="hljs-params"><span class="hljs-built_in">input</span>: torch.Tensor</span>) -> torch.Tensor: | |
| <span class="hljs-keyword">return</span> torch.empty_like(<span class="hljs-built_in">input</span>)`,lang:"python",wrap:!1}}),Se=new T({props:{code:"ZnJvbSUyMC5fb3BzJTIwaW1wb3J0JTIwYWRkX29wX25hbWVzcGFjZV9wcmVmaXglMEElMEElNDB0b3JjaC5saWJyYXJ5LnJlZ2lzdGVyX2Zha2UoYWRkX29wX25hbWVzcGFjZV9wcmVmaXgoJTIycmVsdV9md2QlMjIpKSUwQWRlZiUyMHJlbHVfZndkX2Zha2UoaW5wdXQlM0ElMjB0b3JjaC5UZW5zb3IpJTIwLSUzRSUyMHRvcmNoLlRlbnNvciUzQSUwQSUyMCUyMCUyMCUyMHJldHVybiUyMHRvcmNoLmVtcHR5X2xpa2UoaW5wdXQp",highlighted:`<span class="hljs-keyword">from</span> ._ops <span class="hljs-keyword">import</span> add_op_namespace_prefix | |
| <span class="hljs-meta">@torch.library.register_fake(<span class="hljs-params">add_op_namespace_prefix(<span class="hljs-params"><span class="hljs-string">"relu_fwd"</span></span>)</span>)</span> | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">relu_fwd_fake</span>(<span class="hljs-params"><span class="hljs-built_in">input</span>: torch.Tensor</span>) -> torch.Tensor: | |
| <span class="hljs-keyword">return</span> torch.empty_like(<span class="hljs-built_in">input</span>)`,lang:"python",wrap:!1}}),Pe=new T({props:{code:"JTQwc29tZV9pbmRpcmVjdGlvbl9mb3JfcmVnaXN0ZXJfZmFrZSglMjJyZWx1JTNBJTNBcmVsdV9md2QlMjIpJTBBZGVmJTIwcmVsdV9md2RfZmFrZShpbnB1dCUzQSUyMHRvcmNoLlRlbnNvciklMjAtJTNFJTIwdG9yY2guVGVuc29yJTNBJTBBJTIwJTIwJTIwJTIwcmV0dXJuJTIwdG9yY2guZW1wdHlfbGlrZShpbnB1dCk=",highlighted:`<span class="hljs-meta">@some_indirection_for_register_fake(<span class="hljs-params"><span class="hljs-string">"relu::relu_fwd"</span></span>)</span> | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">relu_fwd_fake</span>(<span class="hljs-params"><span class="hljs-built_in">input</span>: torch.Tensor</span>) -> torch.Tensor: | |
| <span class="hljs-keyword">return</span> torch.empty_like(<span class="hljs-built_in">input</span>)`,lang:"python",wrap:!1}}),Ye=new f({props:{title:"Kernel tests",local:"kernel-tests",headingTag:"h2"}}),Oe=new T({props:{code:"aW1wb3J0JTIwcHl0ZXN0JTBBJTBBJTQwcHl0ZXN0Lm1hcmsua2VybmVsc19jaSUwQWRlZiUyMHRlc3RfbXlrZXJuZWwoKSUzQSUwQSUyMCUyMC4uLg==",highlighted:`<span class="hljs-keyword">import</span> pytest | |
| <span class="hljs-meta">@pytest.mark.kernels_ci</span> | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">test_mykernel</span>(): | |
| ...`,lang:"python",wrap:!1}}),Ke=new T({props:{code:"JTI0JTIwbml4JTIwcnVuJTIwLiUyM2NpLXRlc3Q=",highlighted:'$ nix run .<span class="hljs-comment">#ci-test</span>',lang:"bash",wrap:!1}}),tt=new T({props:{code:"JTI0JTIwbml4JTIwcnVuJTIwLiUyM2NpVGVzdHMudG9yY2gyMTAtY3h4MTEtY3B1LXg4Nl82NC1saW51eA==",highlighted:'$ nix run .<span class="hljs-comment">#ciTests.torch210-cxx11-cpu-x86_64-linux</span>',lang:"bash",wrap:!1}}),nt=new f({props:{title:"Kernel docs",local:"kernel-docs",headingTag:"h2"}}),ot=new bi({props:{source:"https://github.com/huggingface/kernels/blob/main/docs/source/builder/writing-kernels.md"}}),{c(){y=a("meta"),ct=i(),rt=a("p"),dt=i(),p(M.$$.fragment),mt=i(),p(k.$$.fragment),ut=i(),p(g.$$.fragment),ht=i(),w=a("p"),w.innerHTML=an,ft=i(),$=a("ul"),$.innerHTML=on,Tt=i(),U=a("p"),U.innerHTML=rn,yt=i(),J=a("ul"),J.innerHTML=pn,bt=i(),C=a("p"),C.innerHTML=cn,Mt=i(),j=a("p"),j.innerHTML=dn,kt=i(),b=a("blockquote"),b.innerHTML=mn,gt=i(),p(v.$$.fragment),wt=i(),p(x.$$.fragment),$t=i(),I=a("p"),I.innerHTML=un,Ut=i(),p(_.$$.fragment),Jt=i(),H=a("p"),H.textContent=hn,Ct=i(),L=a("ol"),L.innerHTML=fn,jt=i(),Z=a("p"),Z.innerHTML=Tn,vt=i(),p(V.$$.fragment),xt=i(),B=a("p"),B.innerHTML=yn,It=i(),p(N.$$.fragment),_t=i(),R=a("p"),R.innerHTML=bn,Ht=i(),W=a("p"),W.textContent=Mn,Lt=i(),p(Q.$$.fragment),Zt=i(),E=a("p"),E.innerHTML=kn,Vt=i(),p(A.$$.fragment),Bt=i(),X=a("p"),X.innerHTML=gn,Nt=i(),S=a("p"),S.innerHTML=wn,Rt=i(),p(G.$$.fragment),Wt=i(),q=a("p"),q.innerHTML=$n,Qt=i(),p(P.$$.fragment),Et=i(),Y=a("p"),Y.innerHTML=Un,At=i(),p(F.$$.fragment),Xt=i(),O=a("p"),O.textContent=Jn,St=i(),p(z.$$.fragment),Gt=i(),D=a("p"),D.textContent=Cn,qt=i(),K=a("ul"),K.innerHTML=jn,Pt=i(),p(ee.$$.fragment),Yt=i(),te=a("p"),te.innerHTML=vn,Ft=i(),p(le.$$.fragment),Ot=i(),ne=a("p"),ne.innerHTML=xn,zt=i(),p(ie.$$.fragment),Dt=i(),se=a("ul"),se.innerHTML=In,Kt=i(),p(ae.$$.fragment),el=i(),oe=a("ul"),oe.innerHTML=_n,tl=i(),p(re.$$.fragment),ll=i(),pe=a("ul"),pe.innerHTML=Hn,nl=i(),p(ce.$$.fragment),il=i(),de=a("p"),de.textContent=Ln,sl=i(),me=a("ul"),me.innerHTML=Zn,al=i(),p(ue.$$.fragment),ol=i(),he=a("p"),he.innerHTML=Vn,rl=i(),fe=a("p"),fe.textContent=Bn,pl=i(),Te=a("ul"),Te.innerHTML=Nn,cl=i(),ye=a("p"),ye.textContent=Rn,dl=i(),p(be.$$.fragment),ml=i(),Me=a("ul"),Me.innerHTML=Wn,ul=i(),p(ke.$$.fragment),hl=i(),ge=a("ul"),ge.innerHTML=Qn,fl=i(),p(we.$$.fragment),Tl=i(),$e=a("ul"),$e.innerHTML=En,yl=i(),p(Ue.$$.fragment),bl=i(),Je=a("ul"),Je.innerHTML=An,Ml=i(),p(Ce.$$.fragment),kl=i(),p(je.$$.fragment),gl=i(),ve=a("p"),ve.textContent=Xn,wl=i(),xe=a("ul"),xe.innerHTML=Sn,$l=i(),Ie=a("p"),Ie.innerHTML=Gn,Ul=i(),p(_e.$$.fragment),Jl=i(),He=a("p"),He.innerHTML=qn,Cl=i(),p(Le.$$.fragment),jl=i(),Ze=a("p"),Ze.innerHTML=Pn,vl=i(),p(Ve.$$.fragment),xl=i(),Be=a("p"),Be.innerHTML=Yn,Il=i(),Ne=a("p"),Ne.innerHTML=Fn,_l=i(),p(Re.$$.fragment),Hl=i(),p(We.$$.fragment),Ll=i(),Qe=a("p"),Qe.innerHTML=On,Zl=i(),Ee=a("p"),Ee.innerHTML=zn,Vl=i(),p(Ae.$$.fragment),Bl=i(),Xe=a("p"),Xe.textContent=Dn,Nl=i(),p(Se.$$.fragment),Rl=i(),Ge=a("p"),Ge.innerHTML=Kn,Wl=i(),qe=a("p"),qe.innerHTML=ei,Ql=i(),p(Pe.$$.fragment),El=i(),p(Ye.$$.fragment),Al=i(),Fe=a("p"),Fe.innerHTML=ti,Xl=i(),p(Oe.$$.fragment),Sl=i(),ze=a("p"),ze.textContent=li,Gl=i(),De=a("p"),De.textContent=ni,ql=i(),p(Ke.$$.fragment),Pl=i(),et=a("p"),et.innerHTML=ii,Yl=i(),p(tt.$$.fragment),Fl=i(),lt=a("p"),lt.innerHTML=si,Ol=i(),p(nt.$$.fragment),zl=i(),it=a("p"),it.innerHTML=ai,Dl=i(),st=a("p"),st.innerHTML=oi,Kl=i(),at=a("p"),at.innerHTML=ri,en=i(),p(ot.$$.fragment),tn=i(),pt=a("p"),this.h()},l(e){const t=fi("svelte-u9bgzb",document.head);y=o(t,"META",{name:!0,content:!0}),t.forEach(l),ct=s(e),rt=o(e,"P",{}),pi(rt).forEach(l),dt=s(e),c(M.$$.fragment,e),mt=s(e),c(k.$$.fragment,e),ut=s(e),c(g.$$.fragment,e),ht=s(e),w=o(e,"P",{"data-svelte-h":!0}),r(w)!=="svelte-1i1c9ni"&&(w.innerHTML=an),ft=s(e),$=o(e,"UL",{"data-svelte-h":!0}),r($)!=="svelte-1odnsz3"&&($.innerHTML=on),Tt=s(e),U=o(e,"P",{"data-svelte-h":!0}),r(U)!=="svelte-1gp9ycj"&&(U.innerHTML=rn),yt=s(e),J=o(e,"UL",{"data-svelte-h":!0}),r(J)!=="svelte-ysrhph"&&(J.innerHTML=pn),bt=s(e),C=o(e,"P",{"data-svelte-h":!0}),r(C)!=="svelte-vy7wcb"&&(C.innerHTML=cn),Mt=s(e),j=o(e,"P",{"data-svelte-h":!0}),r(j)!=="svelte-o9ssdv"&&(j.innerHTML=dn),kt=s(e),b=o(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),r(b)!=="svelte-43d87d"&&(b.innerHTML=mn),gt=s(e),c(v.$$.fragment,e),wt=s(e),c(x.$$.fragment,e),$t=s(e),I=o(e,"P",{"data-svelte-h":!0}),r(I)!=="svelte-96m8sj"&&(I.innerHTML=un),Ut=s(e),c(_.$$.fragment,e),Jt=s(e),H=o(e,"P",{"data-svelte-h":!0}),r(H)!=="svelte-1b4vj4e"&&(H.textContent=hn),Ct=s(e),L=o(e,"OL",{"data-svelte-h":!0}),r(L)!=="svelte-3arzgs"&&(L.innerHTML=fn),jt=s(e),Z=o(e,"P",{"data-svelte-h":!0}),r(Z)!=="svelte-1ihjqjm"&&(Z.innerHTML=Tn),vt=s(e),c(V.$$.fragment,e),xt=s(e),B=o(e,"P",{"data-svelte-h":!0}),r(B)!=="svelte-1cac215"&&(B.innerHTML=yn),It=s(e),c(N.$$.fragment,e),_t=s(e),R=o(e,"P",{"data-svelte-h":!0}),r(R)!=="svelte-4lye9k"&&(R.innerHTML=bn),Ht=s(e),W=o(e,"P",{"data-svelte-h":!0}),r(W)!=="svelte-g5i707"&&(W.textContent=Mn),Lt=s(e),c(Q.$$.fragment,e),Zt=s(e),E=o(e,"P",{"data-svelte-h":!0}),r(E)!=="svelte-cn9mkc"&&(E.innerHTML=kn),Vt=s(e),c(A.$$.fragment,e),Bt=s(e),X=o(e,"P",{"data-svelte-h":!0}),r(X)!=="svelte-1prqyz3"&&(X.innerHTML=gn),Nt=s(e),S=o(e,"P",{"data-svelte-h":!0}),r(S)!=="svelte-1exh4w8"&&(S.innerHTML=wn),Rt=s(e),c(G.$$.fragment,e),Wt=s(e),q=o(e,"P",{"data-svelte-h":!0}),r(q)!=="svelte-1poutmy"&&(q.innerHTML=$n),Qt=s(e),c(P.$$.fragment,e),Et=s(e),Y=o(e,"P",{"data-svelte-h":!0}),r(Y)!=="svelte-s84xza"&&(Y.innerHTML=Un),At=s(e),c(F.$$.fragment,e),Xt=s(e),O=o(e,"P",{"data-svelte-h":!0}),r(O)!=="svelte-6oo725"&&(O.textContent=Jn),St=s(e),c(z.$$.fragment,e),Gt=s(e),D=o(e,"P",{"data-svelte-h":!0}),r(D)!=="svelte-1lqdx4"&&(D.textContent=Cn),qt=s(e),K=o(e,"UL",{"data-svelte-h":!0}),r(K)!=="svelte-c8vtob"&&(K.innerHTML=jn),Pt=s(e),c(ee.$$.fragment,e),Yt=s(e),te=o(e,"P",{"data-svelte-h":!0}),r(te)!=="svelte-1hgp1cr"&&(te.innerHTML=vn),Ft=s(e),c(le.$$.fragment,e),Ot=s(e),ne=o(e,"P",{"data-svelte-h":!0}),r(ne)!=="svelte-pgruc9"&&(ne.innerHTML=xn),zt=s(e),c(ie.$$.fragment,e),Dt=s(e),se=o(e,"UL",{"data-svelte-h":!0}),r(se)!=="svelte-cm9oc9"&&(se.innerHTML=In),Kt=s(e),c(ae.$$.fragment,e),el=s(e),oe=o(e,"UL",{"data-svelte-h":!0}),r(oe)!=="svelte-12rq95i"&&(oe.innerHTML=_n),tl=s(e),c(re.$$.fragment,e),ll=s(e),pe=o(e,"UL",{"data-svelte-h":!0}),r(pe)!=="svelte-1fzn2"&&(pe.innerHTML=Hn),nl=s(e),c(ce.$$.fragment,e),il=s(e),de=o(e,"P",{"data-svelte-h":!0}),r(de)!=="svelte-3rear0"&&(de.textContent=Ln),sl=s(e),me=o(e,"UL",{"data-svelte-h":!0}),r(me)!=="svelte-7mmcol"&&(me.innerHTML=Zn),al=s(e),c(ue.$$.fragment,e),ol=s(e),he=o(e,"P",{"data-svelte-h":!0}),r(he)!=="svelte-1weg0gu"&&(he.innerHTML=Vn),rl=s(e),fe=o(e,"P",{"data-svelte-h":!0}),r(fe)!=="svelte-1al5myg"&&(fe.textContent=Bn),pl=s(e),Te=o(e,"UL",{"data-svelte-h":!0}),r(Te)!=="svelte-1fbzu1m"&&(Te.innerHTML=Nn),cl=s(e),ye=o(e,"P",{"data-svelte-h":!0}),r(ye)!=="svelte-1mf578x"&&(ye.textContent=Rn),dl=s(e),c(be.$$.fragment,e),ml=s(e),Me=o(e,"UL",{"data-svelte-h":!0}),r(Me)!=="svelte-3vtlb2"&&(Me.innerHTML=Wn),ul=s(e),c(ke.$$.fragment,e),hl=s(e),ge=o(e,"UL",{"data-svelte-h":!0}),r(ge)!=="svelte-mx7mxt"&&(ge.innerHTML=Qn),fl=s(e),c(we.$$.fragment,e),Tl=s(e),$e=o(e,"UL",{"data-svelte-h":!0}),r($e)!=="svelte-1u3m3l7"&&($e.innerHTML=En),yl=s(e),c(Ue.$$.fragment,e),bl=s(e),Je=o(e,"UL",{"data-svelte-h":!0}),r(Je)!=="svelte-10okur"&&(Je.innerHTML=An),Ml=s(e),c(Ce.$$.fragment,e),kl=s(e),c(je.$$.fragment,e),gl=s(e),ve=o(e,"P",{"data-svelte-h":!0}),r(ve)!=="svelte-r7rot5"&&(ve.textContent=Xn),wl=s(e),xe=o(e,"UL",{"data-svelte-h":!0}),r(xe)!=="svelte-poxr41"&&(xe.innerHTML=Sn),$l=s(e),Ie=o(e,"P",{"data-svelte-h":!0}),r(Ie)!=="svelte-1ikzb58"&&(Ie.innerHTML=Gn),Ul=s(e),c(_e.$$.fragment,e),Jl=s(e),He=o(e,"P",{"data-svelte-h":!0}),r(He)!=="svelte-5ja9lk"&&(He.innerHTML=qn),Cl=s(e),c(Le.$$.fragment,e),jl=s(e),Ze=o(e,"P",{"data-svelte-h":!0}),r(Ze)!=="svelte-ssih46"&&(Ze.innerHTML=Pn),vl=s(e),c(Ve.$$.fragment,e),xl=s(e),Be=o(e,"P",{"data-svelte-h":!0}),r(Be)!=="svelte-1y8rjsx"&&(Be.innerHTML=Yn),Il=s(e),Ne=o(e,"P",{"data-svelte-h":!0}),r(Ne)!=="svelte-a3yu8e"&&(Ne.innerHTML=Fn),_l=s(e),c(Re.$$.fragment,e),Hl=s(e),c(We.$$.fragment,e),Ll=s(e),Qe=o(e,"P",{"data-svelte-h":!0}),r(Qe)!=="svelte-xosw3t"&&(Qe.innerHTML=On),Zl=s(e),Ee=o(e,"P",{"data-svelte-h":!0}),r(Ee)!=="svelte-a5yx0v"&&(Ee.innerHTML=zn),Vl=s(e),c(Ae.$$.fragment,e),Bl=s(e),Xe=o(e,"P",{"data-svelte-h":!0}),r(Xe)!=="svelte-9b7ddb"&&(Xe.textContent=Dn),Nl=s(e),c(Se.$$.fragment,e),Rl=s(e),Ge=o(e,"P",{"data-svelte-h":!0}),r(Ge)!=="svelte-4caz4s"&&(Ge.innerHTML=Kn),Wl=s(e),qe=o(e,"P",{"data-svelte-h":!0}),r(qe)!=="svelte-hkktty"&&(qe.innerHTML=ei),Ql=s(e),c(Pe.$$.fragment,e),El=s(e),c(Ye.$$.fragment,e),Al=s(e),Fe=o(e,"P",{"data-svelte-h":!0}),r(Fe)!=="svelte-q979am"&&(Fe.innerHTML=ti),Xl=s(e),c(Oe.$$.fragment,e),Sl=s(e),ze=o(e,"P",{"data-svelte-h":!0}),r(ze)!=="svelte-1uzdod8"&&(ze.textContent=li),Gl=s(e),De=o(e,"P",{"data-svelte-h":!0}),r(De)!=="svelte-s01sgi"&&(De.textContent=ni),ql=s(e),c(Ke.$$.fragment,e),Pl=s(e),et=o(e,"P",{"data-svelte-h":!0}),r(et)!=="svelte-1ucbtrx"&&(et.innerHTML=ii),Yl=s(e),c(tt.$$.fragment,e),Fl=s(e),lt=o(e,"P",{"data-svelte-h":!0}),r(lt)!=="svelte-gcopz4"&&(lt.innerHTML=si),Ol=s(e),c(nt.$$.fragment,e),zl=s(e),it=o(e,"P",{"data-svelte-h":!0}),r(it)!=="svelte-11q3n4g"&&(it.innerHTML=ai),Dl=s(e),st=o(e,"P",{"data-svelte-h":!0}),r(st)!=="svelte-zjr5ot"&&(st.innerHTML=oi),Kl=s(e),at=o(e,"P",{"data-svelte-h":!0}),r(at)!=="svelte-rt0n0n"&&(at.innerHTML=ri),en=s(e),c(ot.$$.fragment,e),tn=s(e),pt=o(e,"P",{}),pi(pt).forEach(l),this.h()},h(){nn(y,"name","hf:doc:metadata"),nn(y,"content",ki),nn(b,"class","tip")},m(e,t){Ti(document.head,y),n(e,ct,t),n(e,rt,t),n(e,dt,t),d(M,e,t),n(e,mt,t),d(k,e,t),n(e,ut,t),d(g,e,t),n(e,ht,t),n(e,w,t),n(e,ft,t),n(e,$,t),n(e,Tt,t),n(e,U,t),n(e,yt,t),n(e,J,t),n(e,bt,t),n(e,C,t),n(e,Mt,t),n(e,j,t),n(e,kt,t),n(e,b,t),n(e,gt,t),d(v,e,t),n(e,wt,t),d(x,e,t),n(e,$t,t),n(e,I,t),n(e,Ut,t),d(_,e,t),n(e,Jt,t),n(e,H,t),n(e,Ct,t),n(e,L,t),n(e,jt,t),n(e,Z,t),n(e,vt,t),d(V,e,t),n(e,xt,t),n(e,B,t),n(e,It,t),d(N,e,t),n(e,_t,t),n(e,R,t),n(e,Ht,t),n(e,W,t),n(e,Lt,t),d(Q,e,t),n(e,Zt,t),n(e,E,t),n(e,Vt,t),d(A,e,t),n(e,Bt,t),n(e,X,t),n(e,Nt,t),n(e,S,t),n(e,Rt,t),d(G,e,t),n(e,Wt,t),n(e,q,t),n(e,Qt,t),d(P,e,t),n(e,Et,t),n(e,Y,t),n(e,At,t),d(F,e,t),n(e,Xt,t),n(e,O,t),n(e,St,t),d(z,e,t),n(e,Gt,t),n(e,D,t),n(e,qt,t),n(e,K,t),n(e,Pt,t),d(ee,e,t),n(e,Yt,t),n(e,te,t),n(e,Ft,t),d(le,e,t),n(e,Ot,t),n(e,ne,t),n(e,zt,t),d(ie,e,t),n(e,Dt,t),n(e,se,t),n(e,Kt,t),d(ae,e,t),n(e,el,t),n(e,oe,t),n(e,tl,t),d(re,e,t),n(e,ll,t),n(e,pe,t),n(e,nl,t),d(ce,e,t),n(e,il,t),n(e,de,t),n(e,sl,t),n(e,me,t),n(e,al,t),d(ue,e,t),n(e,ol,t),n(e,he,t),n(e,rl,t),n(e,fe,t),n(e,pl,t),n(e,Te,t),n(e,cl,t),n(e,ye,t),n(e,dl,t),d(be,e,t),n(e,ml,t),n(e,Me,t),n(e,ul,t),d(ke,e,t),n(e,hl,t),n(e,ge,t),n(e,fl,t),d(we,e,t),n(e,Tl,t),n(e,$e,t),n(e,yl,t),d(Ue,e,t),n(e,bl,t),n(e,Je,t),n(e,Ml,t),d(Ce,e,t),n(e,kl,t),d(je,e,t),n(e,gl,t),n(e,ve,t),n(e,wl,t),n(e,xe,t),n(e,$l,t),n(e,Ie,t),n(e,Ul,t),d(_e,e,t),n(e,Jl,t),n(e,He,t),n(e,Cl,t),d(Le,e,t),n(e,jl,t),n(e,Ze,t),n(e,vl,t),d(Ve,e,t),n(e,xl,t),n(e,Be,t),n(e,Il,t),n(e,Ne,t),n(e,_l,t),d(Re,e,t),n(e,Hl,t),d(We,e,t),n(e,Ll,t),n(e,Qe,t),n(e,Zl,t),n(e,Ee,t),n(e,Vl,t),d(Ae,e,t),n(e,Bl,t),n(e,Xe,t),n(e,Nl,t),d(Se,e,t),n(e,Rl,t),n(e,Ge,t),n(e,Wl,t),n(e,qe,t),n(e,Ql,t),d(Pe,e,t),n(e,El,t),d(Ye,e,t),n(e,Al,t),n(e,Fe,t),n(e,Xl,t),d(Oe,e,t),n(e,Sl,t),n(e,ze,t),n(e,Gl,t),n(e,De,t),n(e,ql,t),d(Ke,e,t),n(e,Pl,t),n(e,et,t),n(e,Yl,t),d(tt,e,t),n(e,Fl,t),n(e,lt,t),n(e,Ol,t),d(nt,e,t),n(e,zl,t),n(e,it,t),n(e,Dl,t),n(e,st,t),n(e,Kl,t),n(e,at,t),n(e,en,t),d(ot,e,t),n(e,tn,t),n(e,pt,t),ln=!0},p:di,i(e){ln||(m(M.$$.fragment,e),m(k.$$.fragment,e),m(g.$$.fragment,e),m(v.$$.fragment,e),m(x.$$.fragment,e),m(_.$$.fragment,e),m(V.$$.fragment,e),m(N.$$.fragment,e),m(Q.$$.fragment,e),m(A.$$.fragment,e),m(G.$$.fragment,e),m(P.$$.fragment,e),m(F.$$.fragment,e),m(z.$$.fragment,e),m(ee.$$.fragment,e),m(le.$$.fragment,e),m(ie.$$.fragment,e),m(ae.$$.fragment,e),m(re.$$.fragment,e),m(ce.$$.fragment,e),m(ue.$$.fragment,e),m(be.$$.fragment,e),m(ke.$$.fragment,e),m(we.$$.fragment,e),m(Ue.$$.fragment,e),m(Ce.$$.fragment,e),m(je.$$.fragment,e),m(_e.$$.fragment,e),m(Le.$$.fragment,e),m(Ve.$$.fragment,e),m(Re.$$.fragment,e),m(We.$$.fragment,e),m(Ae.$$.fragment,e),m(Se.$$.fragment,e),m(Pe.$$.fragment,e),m(Ye.$$.fragment,e),m(Oe.$$.fragment,e),m(Ke.$$.fragment,e),m(tt.$$.fragment,e),m(nt.$$.fragment,e),m(ot.$$.fragment,e),ln=!0)},o(e){u(M.$$.fragment,e),u(k.$$.fragment,e),u(g.$$.fragment,e),u(v.$$.fragment,e),u(x.$$.fragment,e),u(_.$$.fragment,e),u(V.$$.fragment,e),u(N.$$.fragment,e),u(Q.$$.fragment,e),u(A.$$.fragment,e),u(G.$$.fragment,e),u(P.$$.fragment,e),u(F.$$.fragment,e),u(z.$$.fragment,e),u(ee.$$.fragment,e),u(le.$$.fragment,e),u(ie.$$.fragment,e),u(ae.$$.fragment,e),u(re.$$.fragment,e),u(ce.$$.fragment,e),u(ue.$$.fragment,e),u(be.$$.fragment,e),u(ke.$$.fragment,e),u(we.$$.fragment,e),u(Ue.$$.fragment,e),u(Ce.$$.fragment,e),u(je.$$.fragment,e),u(_e.$$.fragment,e),u(Le.$$.fragment,e),u(Ve.$$.fragment,e),u(Re.$$.fragment,e),u(We.$$.fragment,e),u(Ae.$$.fragment,e),u(Se.$$.fragment,e),u(Pe.$$.fragment,e),u(Ye.$$.fragment,e),u(Oe.$$.fragment,e),u(Ke.$$.fragment,e),u(tt.$$.fragment,e),u(nt.$$.fragment,e),u(ot.$$.fragment,e),ln=!1},d(e){e&&(l(ct),l(rt),l(dt),l(mt),l(ut),l(ht),l(w),l(ft),l($),l(Tt),l(U),l(yt),l(J),l(bt),l(C),l(Mt),l(j),l(kt),l(b),l(gt),l(wt),l($t),l(I),l(Ut),l(Jt),l(H),l(Ct),l(L),l(jt),l(Z),l(vt),l(xt),l(B),l(It),l(_t),l(R),l(Ht),l(W),l(Lt),l(Zt),l(E),l(Vt),l(Bt),l(X),l(Nt),l(S),l(Rt),l(Wt),l(q),l(Qt),l(Et),l(Y),l(At),l(Xt),l(O),l(St),l(Gt),l(D),l(qt),l(K),l(Pt),l(Yt),l(te),l(Ft),l(Ot),l(ne),l(zt),l(Dt),l(se),l(Kt),l(el),l(oe),l(tl),l(ll),l(pe),l(nl),l(il),l(de),l(sl),l(me),l(al),l(ol),l(he),l(rl),l(fe),l(pl),l(Te),l(cl),l(ye),l(dl),l(ml),l(Me),l(ul),l(hl),l(ge),l(fl),l(Tl),l($e),l(yl),l(bl),l(Je),l(Ml),l(kl),l(gl),l(ve),l(wl),l(xe),l($l),l(Ie),l(Ul),l(Jl),l(He),l(Cl),l(jl),l(Ze),l(vl),l(xl),l(Be),l(Il),l(Ne),l(_l),l(Hl),l(Ll),l(Qe),l(Zl),l(Ee),l(Vl),l(Bl),l(Xe),l(Nl),l(Rl),l(Ge),l(Wl),l(qe),l(Ql),l(El),l(Al),l(Fe),l(Xl),l(Sl),l(ze),l(Gl),l(De),l(ql),l(Pl),l(et),l(Yl),l(Fl),l(lt),l(Ol),l(zl),l(it),l(Dl),l(st),l(Kl),l(at),l(en),l(tn),l(pt)),l(y),h(M,e),h(k,e),h(g,e),h(v,e),h(x,e),h(_,e),h(V,e),h(N,e),h(Q,e),h(A,e),h(G,e),h(P,e),h(F,e),h(z,e),h(ee,e),h(le,e),h(ie,e),h(ae,e),h(re,e),h(ce,e),h(ue,e),h(be,e),h(ke,e),h(we,e),h(Ue,e),h(Ce,e),h(je,e),h(_e,e),h(Le,e),h(Ve,e),h(Re,e),h(We,e),h(Ae,e),h(Se,e),h(Pe,e),h(Ye,e),h(Oe,e),h(Ke,e),h(tt,e),h(nt,e),h(ot,e)}}}const ki='{"title":"Writing Hub kernels with kernel-builder","local":"writing-hub-kernels-with-kernel-builder","sections":[{"title":"Introduction","local":"introduction","sections":[],"depth":2},{"title":"Setting up environment","local":"setting-up-environment","sections":[{"title":"Quick install","local":"quick-install","sections":[],"depth":3},{"title":"Cloud environment","local":"cloud-environment","sections":[],"depth":3}],"depth":2},{"title":"Starting a new kernel","local":"starting-a-new-kernel","sections":[],"depth":2},{"title":"Kernel project layout","local":"kernel-project-layout","sections":[],"depth":2},{"title":"build.toml","local":"buildtoml","sections":[{"title":"general","local":"general","sections":[],"depth":3},{"title":"general.hub","local":"generalhub","sections":[],"depth":3},{"title":"general.cuda","local":"generalcuda","sections":[],"depth":3},{"title":"torch","local":"torch","sections":[],"depth":3},{"title":"kernel.<name>","local":"kernelltnamegt","sections":[{"title":"cuda","local":"cuda","sections":[],"depth":4},{"title":"rocm","local":"rocm","sections":[],"depth":4},{"title":"xpu","local":"xpu","sections":[],"depth":4}],"depth":3},{"title":"cpu","local":"cpu","sections":[],"depth":3}],"depth":2},{"title":"Torch bindings","local":"torch-bindings","sections":[{"title":"Defining bindings","local":"defining-bindings","sections":[],"depth":3}],"depth":2},{"title":"Using kernel functions from Python","local":"using-kernel-functions-from-python","sections":[],"depth":2},{"title":"Registering Torch operators","local":"registering-torch-operators","sections":[],"depth":2},{"title":"Kernel tests","local":"kernel-tests","sections":[],"depth":2},{"title":"Kernel docs","local":"kernel-docs","sections":[],"depth":2}],"depth":1}';function gi(sn){return mi(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class ji extends ui{constructor(y){super(),hi(this,y,gi,Mi,ci,{})}}export{ji as component}; | |
Xet Storage Details
- Size:
- 46.8 kB
- Xet hash:
- abe03ceb0e4f948e6cd6f91f5d620a409dc2d3d2c46db71f0a32c964950329cc
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.