diff --git a/.github/workflows/llama-build-cuda.yaml b/.github/workflows/llama-build-cuda.yaml index 7bd8e3a..779f12c 100644 --- a/.github/workflows/llama-build-cuda.yaml +++ b/.github/workflows/llama-build-cuda.yaml @@ -21,7 +21,7 @@ jobs: run: | $matrix = @{ 'os' = @('ubuntu-24.04') - 'pyver' = @("3.13", "3.14") + 'pyver' = @("3.14") 'cuda' = @("13.1.1") 'releasetag' = @("basic") } @@ -92,6 +92,7 @@ jobs: $env:CMAKE_ARGS = '-DGGML_CUDA=on -DLLAVA_BUILD=off -DCMAKE_CUDA_ARCHITECTURES=75;80;' $env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=OFF $env:CMAKE_ARGS" $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off' + $env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DCMAKE_C_FLAGS="-march=x86-64" -DCMAKE_CXX_FLAGS="-march=x86-64"' # Rename the release version with +cu{cuda_ver} build tag (Get-Content llama_cpp/__init__.py) -replace '__version__ = "([^"]*)"', ('__version__ = "' + '$1' + '+cu' + $cudaVersion + '"') | Set-Content llama_cpp/__init__.py @@ -118,3 +119,4 @@ jobs: +