@@ -228,21 +228,24 @@ NVCCFLAGS += -Wno-deprecated-gpu-targets \
228228 -gencode arch=compute_61,code=compute_61 \
229229 -gencode arch=compute_70,code=compute_70 \
230230 -gencode arch=compute_75,code=compute_75 \
231- -DKCPP_LIMIT_CUDA_MAX_ARCH=750
231+ -DKCPP_LIMIT_CUDA_MAX_ARCH=750 \
232+ -DKCPP_BACKUP_CUDA_ARCH_REF="35,50,61,70,75"
232233
233234else ifdef LLAMA_ARCHES_CU12
234235NVCCFLAGS += -Wno-deprecated-gpu-targets \
235236 -gencode arch=compute_50,code=compute_50 \
236237 -gencode arch=compute_61,code=compute_61 \
237238 -gencode arch=compute_70,code=compute_70 \
238239 -gencode arch=compute_75,code=compute_75 \
239- -gencode arch=compute_80,code=compute_80
240+ -gencode arch=compute_80,code=compute_80 \
241+ -DKCPP_BACKUP_CUDA_ARCH_REF="50,61,70,75,80"
240242
241243else ifdef LLAMA_ARCHES_CU13
242244NVCCFLAGS += -Wno-deprecated-gpu-targets \
243245 -gencode arch=compute_75,code=compute_75 \
244246 -gencode arch=compute_80,code=compute_80 \
245- -gencode arch=compute_86,code=compute_86
247+ -gencode arch=compute_86,code=compute_86 \
248+ -DKCPP_BACKUP_CUDA_ARCH_REF="75,80,86"
246249
247250else
248251NVCCFLAGS += -Wno-deprecated-gpu-targets -arch=all
0 commit comments