@@ -16,11 +16,6 @@ concurrency:
16
16
group : ${{ github.workflow }}-${{ github.head_ref && github.ref || github.run_id }}
17
17
cancel-in-progress : true
18
18
19
- # Fine-grained permissions
20
- # https://docs.github.com/en/actions/security-for-github-actions/security-guides/automatic-token-authentication#modifying-the-permissions-for-the-github_token
21
- permissions :
22
- contents : write # for creating release
23
-
24
19
env :
25
20
BRANCH_NAME : ${{ github.head_ref || github.ref_name }}
26
21
CMAKE_ARGS : " -DLLAMA_BUILD_EXAMPLES=OFF -DLLAMA_BUILD_TESTS=OFF -DLLAMA_BUILD_TOOLS=ON -DLLAMA_BUILD_SERVER=ON -DGGML_RPC=ON"
@@ -416,28 +411,27 @@ jobs:
416
411
CURL_PATH : ${{ steps.get_libcurl.outputs.curl_path }}
417
412
run : |
418
413
cp $env:CURL_PATH\bin\libcurl-x64.dll .\build\bin\Release\libcurl-x64.dll
419
- 7z a llama-${{ steps.tag.outputs.name }}-bin-win-${{ matrix.build }}-cu ${{ matrix.cuda }}-x64.zip .\build\bin\Release\*
414
+ 7z a llama-${{ steps.tag.outputs.name }}-bin-win-cuda ${{ matrix.cuda }}-x64.zip .\build\bin\Release\*
420
415
421
416
- name : Upload artifacts
422
417
uses : actions/upload-artifact@v4
423
418
with :
424
- path : llama-${{ steps.tag.outputs.name }}-bin-win-${{ matrix.build }}-cu ${{ matrix.cuda }}-x64.zip
425
- name : llama-bin-win-cu ${{ matrix.cuda }}-x64.zip
419
+ path : llama-${{ steps.tag.outputs.name }}-bin-win-cuda ${{ matrix.cuda }}-x64.zip
420
+ name : llama-bin-win-cuda ${{ matrix.cuda }}-x64.zip
426
421
427
422
- name : Copy and pack Cuda runtime
428
- if : ${{ github.event_name == 'push' && github.ref == 'refs/heads/master' }}
429
423
run : |
430
424
echo "Cuda install location: ${{ env.CUDA_PATH }}"
431
425
$dst='.\build\bin\cudart\'
432
426
robocopy "${{env.CUDA_PATH}}\bin" $dst cudart64_*.dll cublas64_*.dll cublasLt64_*.dll
433
427
robocopy "${{env.CUDA_PATH}}\lib" $dst cudart64_*.dll cublas64_*.dll cublasLt64_*.dll
434
- 7z a cudart-llama-bin-win-cu ${{ matrix.cuda }}-x64.zip $dst\*
428
+ 7z a cudart-llama-bin-win-cuda ${{ matrix.cuda }}-x64.zip $dst\*
435
429
436
430
- name : Upload Cuda runtime
437
431
uses : actions/upload-artifact@v4
438
432
with :
439
- path : cudart-llama-bin-win-cu ${{ matrix.cuda }}-x64.zip
440
- name : cudart-llama-bin-win-cu ${{ matrix.cuda }}-x64.zip
433
+ path : cudart-llama-bin-win-cuda ${{ matrix.cuda }}-x64.zip
434
+ name : cudart-llama-bin-win-cuda ${{ matrix.cuda }}-x64.zip
441
435
442
436
windows-sycl :
443
437
runs-on : windows-latest
@@ -646,6 +640,11 @@ jobs:
646
640
release :
647
641
if : ${{ ( github.event_name == 'push' && github.ref == 'refs/heads/master' ) || github.event.inputs.create_release == 'true' }}
648
642
643
+ # Fine-grained permissions
644
+ # https://docs.github.com/en/actions/security-for-github-actions/security-guides/automatic-token-authentication#modifying-the-permissions-for-the-github_token
645
+ permissions :
646
+ contents : write # for creating release
647
+
649
648
runs-on : ubuntu-latest
650
649
651
650
needs :
0 commit comments