@@ -13,8 +13,8 @@ ifndef UNAME_M
13
13
UNAME_M := $(shell uname -m)
14
14
endif
15
15
16
- CCV : = $(shell $(CC ) --version | head -n 1)
17
- CXXV : = $(shell $(CXX ) --version | head -n 1)
16
+ # Compiler version banners. Recursive (=) assignment: the command runs each
+ # time CCV/CXXV is expanded, so it sees later changes to CC/CXX (for example
+ # the LLAMA_HIPBLAS override further down).
+ CCV = $(shell $(CC) --version | head -n 1)
17
+ CXXV = $(shell $(CXX) --version | head -n 1)
18
18
19
19
# Mac OS + Arm can report x86_64
20
20
# ref: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789
@@ -108,14 +108,17 @@ ggml-cuda.o: ggml-cuda.cu ggml-cuda.h
108
108
nvcc -arch=native -c -o $@ $<
109
109
endif
110
110
ifdef LLAMA_HIPBLAS
111
- ROCM_PATH ?= /opt/rocm
112
- LDFLAGS += -lhipblas -lamdhip64 -L$(ROCM_PATH)/lib -Wl,-rpath=$(ROCM_PATH)/lib
113
- HIPCC ?= $(ROCM_PATH)/bin/hipcc
114
- OBJS += ggml-cuda.o
115
- ggml.o : CFLAGS += -DGGML_USE_HIPBLAS -D__HIP_PLATFORM_AMD__ -I$(ROCM_PATH ) /include
116
- ggml-cuda.o : CXXFLAGS += -march=native -D__HIP_PLATFORM_AMD__ -I$(ROCMPATH ) /include
111
+ ROCM_PATH ?= /opt/rocm
112
+ CC := $(ROCM_PATH)/llvm/bin/clang
113
+ CXX := $(ROCM_PATH)/llvm/bin/clang++
114
+ GPU_TARGETS!= $(ROCM_PATH)/llvm/bin/offload-arch
115
+ CFLAGS += -DGGML_USE_HIPBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
116
+ CXXFLAGS += -DGGML_USE_HIPBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
117
+ # Link against the same ROCm tree that supplies the compiler and hipconfig.
+ LDFLAGS += -L$(ROCM_PATH)/lib -lhipblas -lamdhip64
118
+ OBJS += ggml-cuda.o
119
+ # One --offload-arch=<target> flag per word in GPU_TARGETS, applied only when building ggml-cuda.o.
+ ggml-cuda.o : CXXFLAGS += $(addprefix --offload-arch=,$(GPU_TARGETS))
117
120
ggml-cuda.o : ggml-cuda.cu ggml-cuda.h
118
- $(HIPCC ) $(CXXFLAGS ) -x hip $( HIPFLAGS ) -c -o $@ $<
121
+ $(CXX) $(CXXFLAGS) -x hip -c -o $@ $<
119
122
endif
120
123
ifdef LLAMA_GPROF
121
124
CFLAGS += -pg
0 commit comments