mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-13 12:10:18 +00:00
Fix NVCC version detection in the Makefile; replace __halves2half2 with make_half2
This commit is contained in:
parent
24cc6f008f
commit
33ab185dd1
1
Makefile
1
Makefile
@ -176,6 +176,7 @@ ifdef LLAMA_CUDA
|
|||||||
OBJS += ggml-cuda.o
|
OBJS += ggml-cuda.o
|
||||||
NVCC = nvcc
|
NVCC = nvcc
|
||||||
NVCCFLAGS = --forward-unknown-to-host-compiler
|
NVCCFLAGS = --forward-unknown-to-host-compiler
|
||||||
|
NVCCV := $(shell $(NVCC) --version | tail -n 1)
|
||||||
ifdef LLAMA_DEBUG
|
ifdef LLAMA_DEBUG
|
||||||
NVCCFLAGS += -lineinfo
|
NVCCFLAGS += -lineinfo
|
||||||
endif # LLAMA_DEBUG
|
endif # LLAMA_DEBUG
|
||||||
|
@ -14,7 +14,7 @@ template<> struct vec2_t_impl<float> { typedef float2 type; };
|
|||||||
template<typename T> using vec2_t = typename vec2_t_impl<T>::type;
|
template<typename T> using vec2_t = typename vec2_t_impl<T>::type;
|
||||||
|
|
||||||
template<typename T> inline __host__ __device__ vec2_t<T> make_vec2_t(const T & x, const T & y);
|
template<typename T> inline __host__ __device__ vec2_t<T> make_vec2_t(const T & x, const T & y);
|
||||||
template<> inline __host__ __device__ vec2_t<half> make_vec2_t(const half & x, const half & y) { return __halves2half2(x, y); }
|
template<> inline __host__ __device__ vec2_t<half> make_vec2_t(const half & x, const half & y) { return make_half2 (x, y); }
|
||||||
template<> inline __host__ __device__ vec2_t<float> make_vec2_t(const float & x, const float & y) { return make_float2(x, y); }
|
template<> inline __host__ __device__ vec2_t<float> make_vec2_t(const float & x, const float & y) { return make_float2(x, y); }
|
||||||
|
|
||||||
// the cuda headers define operators for half2, but not for float2
|
// the cuda headers define operators for half2, but not for float2
|
||||||
|
Loading…
Reference in New Issue
Block a user