From a8180351baa3749dc3b22e72d69e4a7bd2dca452 Mon Sep 17 00:00:00 2001 From: Eric Buehler Date: Tue, 7 Jan 2025 20:47:29 -0500 Subject: [PATCH] Include assert --- mistralrs-core/src/cuda/nonzero_bitwise.cu | 7 +++---- mistralrs-quant/kernels/hqq/hqq.cu | 1 + 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/mistralrs-core/src/cuda/nonzero_bitwise.cu b/mistralrs-core/src/cuda/nonzero_bitwise.cu index f140c01e1..ced2f9ff8 100644 --- a/mistralrs-core/src/cuda/nonzero_bitwise.cu +++ b/mistralrs-core/src/cuda/nonzero_bitwise.cu @@ -2,6 +2,7 @@ // https://github.com/pytorch/pytorch/blob/65aa16f968af2cd18ff8c25cc657e7abda594bfc/aten/src/ATen/native/cuda/Nonzero.cu #include #include +#include int next_power_of_2(const uint32_t num_nonzero) { int result = 1; @@ -45,9 +46,7 @@ void count_nonzero(const T *d_in, const uint32_t N, uint32_t *h_out) { #define COUNT_NONZERO_OP_DUMMY(RUST_NAME) \ extern "C" uint32_t count_nonzero_##RUST_NAME(const uint16_t *d_in, \ uint32_t N) { \ - uint32_t result; \ - count_nonzero(d_in, N, &result); \ - return result; \ + return 0; \ } #if __CUDA_ARCH__ >= 800 @@ -130,7 +129,7 @@ void nonzero(const T *d_in, const uint32_t N, const uint32_t num_nonzero, extern "C" void nonzero_##RUST_NAME( \ const uint16_t *d_in, uint32_t N, uint32_t num_nonzero, \ const uint32_t *dims, uint32_t num_dims, uint32_t *d_out) { \ - nonzero(d_in, N, num_nonzero, dims, num_dims, d_out); \ + assert(false); \ } #if __CUDA_ARCH__ >= 800 diff --git a/mistralrs-quant/kernels/hqq/hqq.cu b/mistralrs-quant/kernels/hqq/hqq.cu index 1cd33ac3b..2efd7ac85 100644 --- a/mistralrs-quant/kernels/hqq/hqq.cu +++ b/mistralrs-quant/kernels/hqq/hqq.cu @@ -3,6 +3,7 @@ #include #include #include +#include #if __CUDA_ARCH__ >= 530 #include "cuda_fp16.h"