Fix NVCC version in Makefile; replace __halves2half2 with make_half2

2025-02-02 15:02:47 +01:00 · 2023-07-16 00:20:43 +02:00 · 2023-07-16 00:20:43 +02:00 · 33ab185dd1
commit 33ab185dd1
parent 24cc6f008f
2 changed files with 2 additions and 1 deletion
--- a/Makefile
+++ b/Makefile
@@ -176,6 +176,7 @@ ifdef LLAMA_CUDA
 	OBJS      += ggml-cuda.o
 	NVCC      = nvcc
 	NVCCFLAGS = --forward-unknown-to-host-compiler
+	NVCCV 	  := $(shell $(NVCC) --version | tail -n 1)
 ifdef LLAMA_DEBUG
 	NVCCFLAGS += -lineinfo
 endif # LLAMA_DEBUG
--- a/ggml-cuda-kern.h
+++ b/ggml-cuda-kern.h
@@ -14,7 +14,7 @@ template<> struct vec2_t_impl<float>  { typedef float2 type; };
 template<typename T> using vec2_t = typename vec2_t_impl<T>::type;

 template<typename T> inline __host__ __device__ vec2_t<T> make_vec2_t(const T & x, const T & y);
-template<> inline __host__ __device__ vec2_t<half>  make_vec2_t(const  half & x, const  half & y) { return __halves2half2(x, y); }
+template<> inline __host__ __device__ vec2_t<half>  make_vec2_t(const  half & x, const  half & y) { return make_half2 (x, y); }
 template<> inline __host__ __device__ vec2_t<float> make_vec2_t(const float & x, const float & y) { return make_float2(x, y); }

 // the cuda headers define operators for half2, but not for float2