Skip to content

Commit

Permalink
add restrict for dst
Browse files Browse the repository at this point in the history
  • Loading branch information
piDack committed Aug 29, 2024
1 parent 5999d6d commit 316a049
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion ggml/src/ggml-cuda/ssm_conv.cu
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ static __global__ void ssm_conv_f32(
const float * __restrict__ src0, const float * __restrict__ src1,
const int src0_nb0, const int src0_nb1, const int src0_nb2,
const int src1_nb1,
- float * dst,
+ float * __restrict__ dst,
const int dst_nb0, const int dst_nb1, const int dst_nb2,
const int nc, const int ncs, const int nr, const int n_t, const int n_s) {

Expand Down
2 changes: 1 addition & 1 deletion ggml/src/ggml-cuda/ssm_scan.cu
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ static __global__ void ssm_scan_f32(
const int src3_nb1,
const int src4_nb1, const int src4_nb2,
const int src5_nb1, const int src5_nb2,
- float * dst,
+ float * __restrict__ dst,
const int nc, const int nr, const int n_t, const int n_s) {

// const int row = blockIdx.x*blockDim.y + threadIdx.y;
Expand Down

0 comments on commit 316a049

Please sign in to comment.