File tree 2 files changed +10
-0
lines changed
2 files changed +10
-0
lines changed Original file line number Diff line number Diff line change @@ -39,6 +39,7 @@ set(fbgemm_gpu_sources_cpu_static
39
39
src/layout_transform_ops/layout_transform_ops_cpu.cpp
40
40
src/quantize_ops/quantize_ops_cpu.cpp
41
41
src/quantize_ops/quantize_ops_meta.cpp
42
+ src/sparse_ops/sparse_async_batched_cumsum.cpp
42
43
src/sparse_ops/sparse_ops_cpu.cpp
43
44
src/sparse_ops/sparse_ops_meta.cpp
44
45
${tbe_eeg_cpu_sources} )
@@ -101,6 +102,7 @@ if(NOT FBGEMM_BUILD_VARIANT STREQUAL BUILD_VARIANT_CPU)
101
102
src/quantize_ops/quantize_msfp.cu
102
103
src/quantize_ops/quantize_padded_fp8_rowwise.cu
103
104
src/quantize_ops/quantize_mx.cu
105
+ src/sparse_ops/sparse_async_batched_cumsum.cu
104
106
src/sparse_ops/sparse_block_bucketize_features.cu
105
107
src/sparse_ops/sparse_bucketize_features.cu
106
108
src/sparse_ops/sparse_batched_unary_embeddings.cu
Original file line number Diff line number Diff line change 6
6
* LICENSE file in the root directory of this source tree.
7
7
*/
8
8
9
+ #ifdef __HIP_PLATFORM_AMD__
10
+ #include <hipcub/block/block_scan.hpp>
11
+ #else
9
12
#include <cub/block/block_scan.cuh>
13
+ #endif
10
14
#include "common.cuh"
11
15
12
16
static constexpr uint32_t kMaxThreads = 1024 ;
13
17
18
+ #ifdef __HIP_PLATFORM_AMD__
19
+ namespace cub = hipcub;
20
+ #endif
21
+
14
22
namespace fbgemm_gpu {
15
23
16
24
C10_ALWAYS_INLINE uint32_t next_power_of_2 (uint32_t n) {
You can’t perform that action at this time.
0 commit comments