From 45768e4dce976dbafaa52c6a2416b1313d4c0cf3 Mon Sep 17 00:00:00 2001 From: Tronica Date: Sun, 26 Jan 2025 20:05:25 +0100 Subject: [PATCH 1/2] fix typo in kernels.cu --- ntt/kernels.cu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ntt/kernels.cu b/ntt/kernels.cu index 0b36033..0152423 100644 --- a/ntt/kernels.cu +++ b/ntt/kernels.cu @@ -59,7 +59,7 @@ template __launch_bounds__(192, 2) __global__ void bit_rev_permutation_z(fr_t* out, const fr_t* in, uint32_t lg_domain_size) { - static_assert((Z_COUNT & (Z_COUNT-1)) == 0, "unvalid Z_COUNT"); + static_assert((Z_COUNT & (Z_COUNT-1)) == 0, "invalid Z_COUNT"); const uint32_t LG_Z_COUNT = lg2(Z_COUNT); extern __shared__ int xchg_bit_rev[]; From f202ba41d49bc9c542e23e59e998d866e19b9079 Mon Sep 17 00:00:00 2001 From: Tronica Date: Sun, 26 Jan 2025 20:06:22 +0100 Subject: [PATCH 2/2] fix typos in sort.cuh --- msm/sort.cuh | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/msm/sort.cuh b/msm/sort.cuh index 0b2928c..8a9cd09 100644 --- a/msm/sort.cuh +++ b/msm/sort.cuh @@ -18,7 +18,7 @@ #endif __launch_bounds__(SORT_BLOCKDIM) -__global__ void sort(vec2d_t inouts, size_t len, uint32_t win, +__global__ void sort(vec2d_t inputs, size_t len, uint32_t win, vec2d_t temps, vec2d_t histograms, uint32_t wbits, uint32_t lsbits0, uint32_t lsbits1); @@ -364,12 +364,12 @@ __global__ void sort(uint32_t inout[], size_t len, uint2 temp[], #endif __launch_bounds__(SORT_BLOCKDIM) -__global__ void sort(vec2d_t inouts, size_t len, uint32_t win, +__global__ void sort(vec2d_t inputs, size_t len, uint32_t win, vec2d_t temps, vec2d_t histograms, uint32_t wbits, uint32_t lsbits0, uint32_t lsbits1) { win += blockIdx.y; - sort_row(inouts[win], len, temps[blockIdx.y], histograms[win], + sort_row(inputs[win], len, temps[blockIdx.y], histograms[win], wbits, blockIdx.y==0 ? lsbits0 : lsbits1); }