@@ -26,62 +26,95 @@ file(GLOB kernel_impl_h "impl/*.h" "selected_rows/impl/*.h")
2626file (GLOB kernel_primitive_h "primitive/*.h" )
2727
2828# fusion ops would be included here
29- #file(
30- # GLOB kernel_cu
31- # RELATIVE "${CMAKE_CURRENT_SOURCE_DIR}"
32- # "gpu/*.cu"
33- # "gpu/*.cu.cc"
34- # "gpudnn/*.cu"
35- # "kps/*.cu"
36- # "legacy/kps/*.cu"
37- # "legacy/gpu/*.cu"
38- # "selected_rows/gpu/*.cu"
39- # "sparse/gpu/*.cu"
40- # "strings/gpu/*.cu"
41- # "fusion/gpu/*.cu")
4229file (
4330 GLOB kernel_cu
4431 RELATIVE "${CMAKE_CURRENT_SOURCE_DIR} "
45- "gpu/s*.cu.cc"
46- "gpu/c*.cu"
47- "gpu/s*.cu"
48- "gpu/abs_kernel.cu"
49- "gpu/uniform_kernel.cu"
50- "gpu/activation_kernel.cu"
51- "gpu/full_kernel.cu"
52- "gpu/cholesky_kernel.cu"
53- "gpu/cholesky_solve_kernel.cu"
54- "gpu/svd_kernel.cu"
55- "gpu/p_norm_grad_kernel.cu"
56- "gpu/matmul_kernel.cu"
57- "gpu/expand_kernel.cu"
58- "gpu/isfinite_kernel.cu"
32+ "gpu/*.cu"
33+ "gpu/*.cu.cc"
34+ "gpudnn/*.cu"
5935 "kps/*.cu"
60- "legacy/gpu/uniform_kernel.cu"
61- "sparse/gpu/mask_kernel.cu"
6236 "legacy/kps/*.cu"
63- )
64- list (REMOVE_ITEM kernel_cu
65- "gpu/check_numerics_kernel.cu"
66- "gpu/cross_entropy_grad_kernel.cu"
67- "gpu/instance_norm_grad_kernel.cu"
68- "gpu/cross_entropy_kernel.cu"
69- "gpu/cholesky_grad_kernel.cu"
70- "gpu/cholesky_solve_grad_kernel.cu"
71- "gpu/conv_transpose_kernel.cu"
72- "gpu/conv_grad_kernel.cu"
73- "gpu/solve_kernel.cu"
74- "gpu/solve_grad_kernel.cu"
75- "gpu/stft_kernel.cu"
76- "gpu/conv_kernel.cu"
77- "gpu/cudnn_lstm_grad_kernel.cu"
78- "gpu/cudnn_lstm_kernel.cu"
79- "gpu/softmax_kernel.cu"
80- "gpu/slogdeterminant_grad_kernel.cu"
81- "gpu/spectral_norm_grad_kernel.cu"
82- "gpu/spectral_norm_kernel.cu"
83- "gpu/svd_grad_kernel.cu"
84- "gpu/conv_transpose_grad_kernel.cu" )
37+ "legacy/gpu/*.cu"
38+ "selected_rows/gpu/*.cu"
39+ "sparse/gpu/*.cu"
40+ "strings/gpu/*.cu"
41+ "fusion/gpu/*.cu" )
42+
43+ # FIXME(@MTAI): compilation errors occur when compiling the following files.
44+ # This needs to be fixed later.
45+ if (WITH_MUSA)
46+ list (REMOVE_ITEM kernel_cu
47+ "fusion/gpu/fused_softmax_mask_grad_kernel.cu"
48+ "fusion/gpu/fused_softmax_mask_kernel.cu"
49+ "gpu/batch_norm_grad_kernel.cu"
50+ "gpu/batch_norm_kernel.cu"
51+ "gpu/check_numerics_kernel.cu"
52+ "gpu/cholesky_grad_kernel.cu"
53+ "gpu/cholesky_solve_grad_kernel.cu"
54+ "gpu/conv_grad_kernel.cu"
55+ "gpu/conv_kernel.cu"
56+ "gpu/cross_entropy_grad_kernel.cu"
57+ "gpu/cross_entropy_kernel.cu"
58+ "gpu/conv_transpose_grad_kernel.cu"
59+ "gpu/conv_transpose_kernel.cu"
60+ "gpu/cudnn_lstm_grad_kernel.cu"
61+ "gpu/cudnn_lstm_kernel.cu"
62+ "gpu/depthwise_conv_grad_kernel.cu"
63+ "gpu/depthwise_conv_kernel.cu"
64+ "gpu/dist_kernel.cu"
65+ "gpu/elementwise_divide_grad_kernel.cu"
66+ "gpu/elementwise_grad_kernel.cu"
67+ "gpu/elementwise_multiply_grad_kernel.cu"
68+ "gpu/erfinv_kernel.cu"
69+ "gpu/exponential_kernel.cu"
70+ "gpu/fft_grad_kernel.cu"
71+ "gpu/fft_kernel.cu"
72+ "gpu/fused_softmax_mask_grad_kernel.cu"
73+ "gpu/gaussian_kernel.cu"
74+ "gpu/gelu_grad_kernel.cu"
75+ "gpu/gelu_kernel.cu"
76+ "gpu/histogram_kernel.cu"
77+ "gpu/instance_norm_grad_kernel.cu"
78+ "gpu/instance_norm_kernel.cu"
79+ "gpu/interpolate_grad_kernel.cu"
80+ "gpu/kthvalue_grad_kernel.cu"
81+ "gpu/kthvalue_kernel.cu"
82+ "gpu/layer_norm_grad_kernel.cu"
83+ "gpu/layer_norm_kernel.cu"
84+ "gpu/llm_int8_mat_mul_kernel.cu"
85+ "gpu/log_softmax_grad_kernel.cu"
86+ "gpu/log_softmax_kernel.cu"
87+ "gpu/lstsq_kernel.cu"
88+ "gpu/nanmedian_kernel.cu"
89+ "gpu/rnn_grad_kernel.cu.cc"
90+ "gpu/rnn_kernel.cu.cc"
91+ "gpu/slogdeterminant_grad_kernel.cu"
92+ "gpu/solve_grad_kernel.cu"
93+ "gpu/solve_kernel.cu"
94+ "gpu/spectral_norm_grad_kernel.cu"
95+ "gpu/spectral_norm_kernel.cu"
96+ "gpu/stft_kernel.cu"
97+ "gpu/svd_grad_kernel.cu"
98+ "gpu/top_k_grad_kernel.cu"
99+ "gpu/top_k_kernel.cu"
100+ "gpu/truncated_gaussian_random_kernel.cu"
101+ "gpudnn/affine_grid_grad_kernel.cu"
102+ "gpudnn/affine_grid_kernel.cu"
103+ "gpudnn/softmax_grad_kernel.cu"
104+ "gpudnn/softmax_kernel.cu"
105+ "gpudnn/conv_grad_kernel.cu"
106+ "gpudnn/conv_kernel.cu"
107+ "gpudnn/conv_transpose_grad_kernel.cu"
108+ "gpudnn/conv_transpose_kernel.cu"
109+ "gpudnn/pool_grad_kernel.cu"
110+ "gpudnn/pool_kernel.cu"
111+ "sparse/gpu/softmax_grad_kernel.cu"
112+ "sparse/gpu/softmax_kernel.cu"
113+ "sparse/gpu/conv_kernel.cu"
114+ "sparse/gpu/pool_kernel.cu"
115+ "strings/gpu/strings_copy_kernel.cu"
116+ "strings/gpu/strings_lower_upper_kernel.cu" )
117+ endif ()
85118
86119if (APPLE OR WIN32 )
87120 list (REMOVE_ITEM kernel_cu "fusion/gpu/fusion_group_kernel.cu" )
0 commit comments