quantization.cpp 303 B

123456789101112131415
  1. #include <torch/extension.h>
  2. torch::Tensor awq_gemm(
  3. torch::Tensor _in_feats,
  4. torch::Tensor _kernel,
  5. torch::Tensor _scaling_factors,
  6. torch::Tensor _zeros,
  7. int split_k_iters);
  8. PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
  9. m.def(
  10. "awq_gemm",
  11. &awq_gemm,
  12. "Quantized GEMM for AWQ");
  13. }