flash-mla / csrc /api /api.cpp
medmekk's picture
Upload folder using huggingface_hub
ccef021 verified
// UNUSED BY KERNEL-BUILDER
// File is retained for reference, but is not currently used in the build process.
// #include <pybind11/pybind11.h>
// #include "sparse_fwd.h"
// #include "sparse_decode.h"
// #include "dense_decode.h"
// #include "dense_fwd.h"
// PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
// m.doc() = "FlashMLA";
// m.def("sparse_decode_fwd", &sparse_attn_decode_interface);
// m.def("dense_decode_fwd", &dense_attn_decode_interface);
// m.def("sparse_prefill_fwd", &sparse_attn_prefill_interface);
// m.def("dense_prefill_fwd", &FMHACutlassSM100FwdRun);
// m.def("dense_prefill_bwd", &FMHACutlassSM100BwdRun);
// }