@@ -14,6 +14,7 @@ static __global__ void mul_mat_f(
14
14
const int ncols, const int nchannels_y, const int stride_row, const int stride_col_y, const int stride_col_dst,
15
15
const int channel_ratio, const int stride_channel_x, const int stride_channel_y, const int stride_channel_dst,
16
16
const int sample_ratio, const int stride_sample_x, const int stride_sample_y, const int stride_sample_dst) {
17
+ #if !defined(GGML_USE_HIP) && !defined(GGML_USE_MUSA)
17
18
typedef tile<16 , 8 , T> tile_A;
18
19
typedef tile< 8 , 8 , T> tile_B;
19
20
typedef tile<16 , 8 , float > tile_C;
@@ -130,6 +131,13 @@ static __global__ void mul_mat_f(
130
131
}
131
132
dst[j*stride_col_dst + row0 + threadIdx .x ] = sum;
132
133
}
134
+ #else
135
+ NO_DEVICE_CODE;
136
+ GGML_UNUSED (x); GGML_UNUSED (y); GGML_UNUSED (ids); GGML_UNUSED (dst);
137
+ GGML_UNUSED (ncols); GGML_UNUSED (nchannels_y); GGML_UNUSED (stride_row); GGML_UNUSED (stride_col_y); GGML_UNUSED (stride_col_dst);
138
+ GGML_UNUSED (channel_ratio); GGML_UNUSED (stride_channel_x); GGML_UNUSED (stride_channel_y); GGML_UNUSED (stride_channel_dst);
139
+ GGML_UNUSED (sample_ratio); GGML_UNUSED (stride_sample_x); GGML_UNUSED (stride_sample_y); GGML_UNUSED (stride_sample_dst);
140
+ #endif // !defined(GGML_USE_HIP) && !defined(GGML_USE_MUSA)
133
141
}
134
142
135
143
template <typename T, int cols_per_block>
0 commit comments