| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| #include "kernel.h" |
|
|
| namespace tensorrt_llm |
| { |
| namespace kernels |
| { |
|
|
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyPerChannel, |
| IdentityActivation, false, false, 2, 2, 256>; |
|
|
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<64>, |
| IdentityActivation, true, true, 2, 2, 256>; |
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<64>, |
| IdentityActivation, true, false, 2, 2, 256>; |
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<64>, |
| IdentityActivation, false, true, 2, 2, 256>; |
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<64>, |
| IdentityActivation, false, false, 2, 2, 256>; |
|
|
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<128>, |
| IdentityActivation, true, true, 2, 2, 256>; |
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<128>, |
| IdentityActivation, true, false, 2, 2, 256>; |
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<128>, |
| IdentityActivation, false, true, 2, 2, 256>; |
| template struct WeightOnlyBatchedGemvKernelLauncher<WeightOnlyQuantType::Int8b, WeightOnlyGroupWise<128>, |
| IdentityActivation, false, false, 2, 2, 256>; |
|
|
| } |
| } |
|
|