We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 0fd8363 commit 54a63c1 (Copy full SHA for 54a63c1)
Makefile
@@ -108,8 +108,15 @@ ggml-cuda.o: ggml-cuda.cu ggml-cuda.h
108
nvcc -arch=native -c -o $@ $<
109
endif
110
ifdef LLAMA_HIPBLAS
111
- CFLAGS += -DGGML_USE_HIPBLAS -D__HIP_PLATFORM_AMD__ -I/opt/rocm/include
112
- LDFLAGS += -lhipblas -lamdhip64 -L/opt/rocm/lib
+ ROCMPATH?= /opt/rocm
+ CFLAGS += -DGGML_USE_HIPBLAS -D__HIP_PLATFORM_AMD__ -I$(ROCMPATH)/include
113
+ CXXFLAGS+= -D__HIP_PLATFORM_AMD__ -I$(ROCMPATH)/include
114
+ HIPFLAGS?= -amdgpu-early-inline-all=true -amdgpu-function-calls=false -march=native
115
+ LDFLAGS += -lhipblas -lamdhip64 -L$(ROCMPATH)/lib
116
+ HIPCC ?= $(ROCMPATH)/bin/hipcc
117
+ OBJS += ggml-cuda.o
118
+ggml-cuda.o: ggml-cuda.cu ggml-cuda.h
119
+ $(HIPCC) $(CXXFLAGS) -x hip $(HIPFLAGS) -c -o $@ $<
120
121
ifdef LLAMA_GPROF
122
CFLAGS += -pg
0 commit comments