// cuda_launch.h
  #include <torch/extension.h>
  #include <ATen/ATen.h>
  #include <vector>
  // Function-like helpers that select the smaller / larger of two expressions.
  // Each argument appears twice in the expansion, so an argument with side
  // effects (e.g. `i++`) may be evaluated twice; pass plain values only.
  // NOTE(review): because these are lowercase macros, any later text of the
  // form `min(...)` / `max(...)` in an including file (including
  // `std::min(...)` / `std::max(...)`) is rewritten by the preprocessor.
  // Confirm no including translation unit relies on the library functions.
  #define min(a, b) ((a) < (b) ? (a) : (b))
  #define max(a, b) ((a) > (b) ? (a) : (b))
  6. std::vector<at::Tensor> index_max_kernel(
  7. at::Tensor index_vals,
  8. at::Tensor indices,
  9. int A_num_block,
  10. int B_num_block
  11. );
  12. at::Tensor mm_to_sparse_kernel(
  13. at::Tensor dense_A,
  14. at::Tensor dense_B,
  15. at::Tensor indices
  16. );
  17. at::Tensor sparse_dense_mm_kernel(
  18. at::Tensor sparse_A,
  19. at::Tensor indices,
  20. at::Tensor dense_B,
  21. int A_num_block
  22. );
  23. at::Tensor reduce_sum_kernel(
  24. at::Tensor sparse_A,
  25. at::Tensor indices,
  26. int A_num_block,
  27. int B_num_block
  28. );
  29. at::Tensor scatter_kernel(
  30. at::Tensor dense_A,
  31. at::Tensor indices,
  32. int B_num_block
  33. );