Skip to content

Commit

Permalink
Merge pull request #468 from ColorfulDick/master
Browse files Browse the repository at this point in the history
修复__restrict__导致的restrict is not allowed错误 (Fix the "restrict is not allowed" error caused by __restrict__)
  • Loading branch information
ztxz16 authored Jun 17, 2024
2 parents 3b7dbb2 + 9c76015 commit 47739b7
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion src/devices/cuda/fastllm-cuda.cu
Original file line number Diff line number Diff line change
Expand Up @@ -391,7 +391,7 @@ __global__ void FastllmSwigluKernel(float* a, float *b, int len, int spatial, in
}
}

- __global__ void FastllmSwigluKernel(half* __restrict__ a, half __restrict__ *b, int len, int spatial, int mid) {
+ __global__ void FastllmSwigluKernel(half* __restrict__ a, half* __restrict__ b, int len, int spatial, int mid) {
int idx = threadIdx.x + blockIdx.x * blockDim.x;
if (idx < len) {
int id = idx / mid * spatial + idx % mid;
Expand Down

0 comments on commit 47739b7

Please sign in to comment.