PyPI - llama-cpp-bin - Versions diffs - 9093.0.0__tar.gz - Mend

llama-cpp-bin 9093.0.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (983) hide show

llama_cpp_bin-9093.0.0/.github/scripts/generate-pep503-index.py ADDED Viewed

@@ -0,0 +1,67 @@
+#!/usr/bin/env python3
+import json
+import os
+import urllib.request
+from pathlib import Path
+# Repository, release tag, and API token all come from the environment;
+# a missing variable raises KeyError as soon as the module is loaded.
+REPO = os.environ["REPO"]
+TAG = os.environ["TAG"]
+TOKEN = os.environ["GITHUB_TOKEN"]
+# GitHub REST endpoint for the release of REPO identified by TAG.
+API_URL = f"https://api.github.com/repos/{REPO}/releases/tags/{TAG}"
+# Headers sent with the release request: bearer auth, the GitHub JSON media
+# type, and a pinned REST API version.
+HEADERS = {
+    "Authorization": f"Bearer {TOKEN}",
+    "Accept": "application/vnd.github+json",
+    "X-GitHub-Api-Version": "2022-11-28",
+}
+def fetch_release():
+    req = urllib.request.Request(API_URL, headers=HEADERS)
+    with urllib.request.urlopen(req) as resp:
+        return json.loads(resp.read())
+def generate_index():
+    release = fetch_release()
+    assets = [
+        a
+        for a in release.get("assets", [])
+        if a["name"].endswith(".whl") or a["name"].endswith(".tar.gz")
+    ]
+    site = Path("site")
+    simple = site / "simple"
+    pkg_dir = simple / "llama-cpp-bin"
+    pkg_dir.mkdir(parents=True, exist_ok=True)
+    root_html = (
+        "<!DOCTYPE html>\n"
+        "<html>\n"
+        "<body>\n"
+        '<a href="llama-cpp-bin/">llama-cpp-bin</a>\n'
+        "</body>\n"
+        "</html>"
+    )
+    (simple / "index.html").write_text(root_html, encoding="utf-8")
+    links = []
+    for asset in assets:
+        links.append(f'<a href="{asset["browser_download_url"]}">{asset["name"]}</a>')
+    pkg_html = (
+        "<!DOCTYPE html>\n"
+        "<html>\n"
+        "<body>\n"
+        + "\n".join(links)
+        + "\n</body>\n"
+        "</html>"
+    )
+    (pkg_dir / "index.html").write_text(pkg_html, encoding="utf-8")
+    print(f"Generated index with {len(assets)} assets")
+if __name__ == "__main__":
+    generate_index()

llama_cpp_bin-9093.0.0/.github/workflows/build-everything.yml ADDED Viewed

@@ -0,0 +1,131 @@
+# Release pipeline entry point: triggers the wheel workflows, builds and
+# publishes the sdist, and regenerates the package index.
+name: Build Everything
+on:
+  # Runs automatically for pushed tags matching 'v*'.
+  push:
+    tags:
+      - 'v*'
+  # Manual runs must name the ref to build.
+  workflow_dispatch:
+    inputs:
+      version:
+        description: 'Git ref to build (tag recommended for releases, e.g. v0.1.0)'
+        required: true
+        type: string
+# Workflow-wide default: write access to repository contents. The release
+# upload and Pages deploy steps in this workflow authenticate with GITHUB_TOKEN.
+permissions:
+  contents: write
+jobs:
+  # Every wheel job below delegates to a reusable workflow in this repository.
+  # `version` resolves to the pushed tag name on `push` events and to the
+  # manual `version` input otherwise.
+  # CUDA and Vulkan are invoked once per OS by overriding the `os` matrix axis
+  # through `config`.
+  build_cuda_wheels_windows:
+    name: CUDA Wheels Windows
+    uses: ./.github/workflows/build-wheels-cuda.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+      config: 'os:windows-2022'
+  build_cuda_wheels_linux:
+    name: CUDA Wheels Linux
+    uses: ./.github/workflows/build-wheels-cuda.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+      config: 'os:ubuntu-22.04'
+  build_vulkan_wheels_windows:
+    name: Vulkan Wheels Windows
+    uses: ./.github/workflows/build-wheels-vulkan.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+      config: 'os:windows-2022'
+  build_vulkan_wheels_linux:
+    name: Vulkan Wheels Linux
+    uses: ./.github/workflows/build-wheels-vulkan.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+      config: 'os:ubuntu-22.04'
+  # The remaining backends pass no `config`, so the called workflow's own
+  # defaults apply.
+  build_wheels_cpu:
+    name: CPU-only Wheels
+    uses: ./.github/workflows/build-wheels-cpu.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+  build_wheels_macos:
+    name: MacOS Wheels
+    uses: ./.github/workflows/build-wheels-macos.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+  build_wheels_rocm:
+    name: ROCm Wheels
+    uses: ./.github/workflows/build-wheels-rocm.yml
+    with:
+      version: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+  # Builds the source distribution, stores it as the `sdist` workflow artifact
+  # (consumed by publish-pypi), and attaches it to the GitHub release.
+  build-sdist:
+    name: Build Source Distribution
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v6
+        with:
+          # Build from the same ref the release is uploaded to. Without this a
+          # manual dispatch would package the ref the run was started on
+          # instead of the requested `version`.
+          ref: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+          submodules: 'recursive'
+      - uses: actions/setup-python@v6
+        with:
+          python-version: "3.11"
+      - run: python -m pip install build
+      - run: python -m build --sdist
+      - uses: actions/upload-artifact@v6
+        with:
+          name: sdist
+          path: dist/*.tar.gz
+      - name: Upload sdist to release
+        uses: svenstaro/upload-release-action@2.7.0
+        with:
+          repo_token: ${{ secrets.GITHUB_TOKEN }}
+          file: ./dist/*.tar.gz
+          tag: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+          file_glob: true
+          overwrite: true
+  # Publishes the sdist produced by build-sdist: downloads the `sdist` artifact
+  # into dist/ and hands that directory to the PyPI publish action.
+  publish-pypi:
+    name: Publish to PyPI
+    needs: build-sdist
+    runs-on: ubuntu-latest
+    environment: pypi
+    # Only an OIDC id-token is requested and no API token is passed to the
+    # publish step; presumably PyPI trusted publishing (confirm in the PyPI
+    # project settings).
+    permissions:
+      id-token: write
+    steps:
+      - uses: actions/download-artifact@v6
+        with:
+          name: sdist
+          path: dist
+      - uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          packages-dir: dist
+  # Regenerates the PEP 503 index from the release's assets and deploys the
+  # resulting ./site directory to GitHub Pages.
+  generate-index:
+    name: Generate PEP 503 Index
+    needs:
+      - build_wheels_cpu
+      - build_wheels_macos
+      - build_cuda_wheels_linux
+      - build_cuda_wheels_windows
+      - build_wheels_rocm
+      - build_vulkan_wheels_linux
+      - build_vulkan_wheels_windows
+      # The index script also lists .tar.gz assets, so wait for the sdist
+      # upload too; otherwise the sdist can be missing from the index.
+      - build-sdist
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/setup-python@v6
+        with:
+          python-version: "3.11"
+      - name: Generate index
+        # The script reads REPO, TAG and GITHUB_TOKEN from the environment.
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          REPO: ${{ github.repository }}
+          TAG: ${{ github.event_name == 'push' && github.ref_name || inputs.version }}
+        run: python .github/scripts/generate-pep503-index.py
+      - name: Deploy to GitHub Pages
+        uses: peaceiris/actions-gh-pages@v4
+        with:
+          github_token: ${{ secrets.GITHUB_TOKEN }}
+          publish_dir: ./site

llama_cpp_bin-9093.0.0/.github/workflows/build-wheels-cpu.yml ADDED Viewed

@@ -0,0 +1,140 @@
+# Builds CPU-only wheels. Can be started manually or called from another
+# workflow; both triggers declare the same three inputs.
+name: Build CPU Wheels
+on:
+  workflow_dispatch:
+    inputs:
+      version:
+        description: 'Git ref to build (tag recommended for releases, e.g. v0.1.0)'
+        required: true
+        type: string
+      # The literal 'Default' keeps the built-in matrix unchanged.
+      config:
+        description: 'Override configurations to build: key1:item1-1,item1-2;key2:item2-1,item2-2'
+        default: 'Default'
+        required: false
+        type: string
+      # The literal 'None' means no matrix exclusions are added.
+      exclude:
+        description: 'Exclude build configurations: key1-1:item1-1,key1-2:item1-2;key2-1:item2-1,key2-2:item2-2'
+        default: 'None'
+        required: false
+        type: string
+  workflow_call:
+    inputs:
+      version:
+        description: 'Git ref to build'
+        required: true
+        type: string
+      config:
+        description: 'Configurations to build: key1:item1-1,item1-2;key2:item2-1,item2-2'
+        default: 'Default'
+        required: false
+        type: string
+      exclude:
+        description: 'Exclude build configurations: key1-1:item1-1,key1-2:item1-2;key2-1:item2-1,key2-2:item2-2'
+        default: 'None'
+        required: false
+        type: string
+permissions:
+  contents: write
+jobs:
+  # Computes the build matrix as compact JSON and exposes it as the `matrix`
+  # job output for build_wheels.
+  define_matrix:
+    name: Define Build Matrix
+    runs-on: ubuntu-latest
+    outputs:
+      matrix: ${{ steps.set-matrix.outputs.matrix }}
+    defaults:
+      run:
+        shell: pwsh
+    # The workflow inputs are handed to the script as environment variables.
+    env:
+      CONFIGIN: ${{ inputs.config }}
+      EXCLUDEIN: ${{ inputs.exclude }}
+    steps:
+      # Starts from the default os/pyver axes. Unless CONFIGIN is 'Default',
+      # each ';'-separated `key:item,item` entry replaces that axis. Unless
+      # EXCLUDEIN is 'None', each ';'-separated group of `key:value` pairs
+      # becomes one entry of the matrix `exclude` list.
+      - name: Define Job Output
+        id: set-matrix
+        run: |
+          $matrix = @{
+              'os' = @('ubuntu-22.04', 'windows-2022')
+              'pyver' = @("3.11")
+          }
+          if ($env:CONFIGIN -ne 'Default') {$env:CONFIGIN.split(';').foreach({$matrix[$_.split(':')[0]] = $_.split(':')[1].split(',')})}
+          if ($env:EXCLUDEIN -ne 'None') {
+              $exclusions = @()
+              $exclusions += $env:EXCLUDEIN.split(';').replace(':','=').replace(',',"`n") | ConvertFrom-StringData
+              $matrix['exclude'] = $exclusions
+          }
+          $matrixOut = ConvertTo-Json $matrix -Compress
+          Write-Output ('matrix=' + $matrixOut) >> $env:GITHUB_OUTPUT
+  # Builds one CPU wheel per matrix combination emitted by define_matrix and
+  # uploads it to the GitHub release for the requested version.
+  build_wheels:
+    name: ${{ matrix.os }} CPU
+    needs: define_matrix
+    runs-on: ${{ matrix.os }}
+    strategy:
+      matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }}
+    defaults:
+      run:
+        shell: pwsh
+    steps:
+      # Checks out the requested ref of the named repository, with submodules.
+      - uses: actions/checkout@v6
+        with:
+          repository: 'vladlearns/llama-cpp-bin'
+          ref: ${{ inputs.version }}
+          submodules: 'recursive'
+      # Windows only: install Ninja and set up the MSVC environment.
+      - name: Install Ninja
+        if: runner.os == 'Windows'
+        run: choco install ninja
+      - name: Setup MSVC
+        if: runner.os == 'Windows'
+        uses: ilammy/msvc-dev-cmd@v1
+      - uses: actions/setup-python@v6
+        with:
+          python-version: ${{ matrix.pyver }}
+      # Linux installs its apt packages first; every OS installs `build`.
+      - name: Install Dependencies
+        run: |
+          if ($IsLinux) {
+            sudo apt-get update
+            sudo apt-get install -y build-essential libssl-dev
+          }
+          python -m pip install build
+      # CMake options are passed through CMAKE_ARGS; Windows additionally
+      # selects the Ninja generator and enables the BoringSSL build option.
+      # The wheel is given the build tag "+cpu".
+      - name: Build Wheel
+        run: |
+          $env:VERBOSE = '1'
+          $env:CMAKE_ARGS = "-DCMAKE_BUILD_TYPE=Release -DGGML_NATIVE=off -DGGML_BACKEND_DL=on -DGGML_CPU_ALL_VARIANTS=on -DGGML_RPC=on -DLLAMA_BUILD_TESTS=off -DLLAMA_BUILD_EXAMPLES=off"
+          if ($IsWindows) {
+            $env:CMAKE_ARGS += " -G 'Ninja' -DLLAMA_BUILD_BORINGSSL=ON"
+          }
+          $env:LLAMA_CPP_BUILD_JOBS = "2"
+          $buildtag = "+cpu"
+          python -m build --wheel -C--build-option=egg_info "-C--build-option=--tag-build=$buildtag"
+      # continue-on-error keeps the job alive when the release upload fails so
+      # that the fallback artifact upload below can still run.
+      - name: Upload files to a GitHub release
+        id: upload-release
+        uses: svenstaro/upload-release-action@2.7.0
+        continue-on-error: true
+        with:
+          repo_token: ${{ secrets.GITHUB_TOKEN }}
+          file: ./dist/*.whl
+          tag: ${{ inputs.version }}
+          release_name: ${{ inputs.version }}
+          file_glob: true
+          make_latest: false
+          overwrite: true
+      # Fallback: keep the wheel as a workflow artifact only when the release
+      # upload step failed.
+      - uses: actions/upload-artifact@v6
+        if: steps.upload-release.outcome == 'failure'
+        with:
+          name: cpu-${{ runner.os }}
+          path: ./dist/*.whl

llama_cpp_bin-9093.0.0/.github/workflows/build-wheels-cuda.yml ADDED Viewed

@@ -0,0 +1,215 @@
+# Builds CUDA wheels. Can be started manually or called from another
+# workflow; both triggers declare the same three inputs.
+name: Build CUDA Wheels
+on:
+  workflow_dispatch:
+    inputs:
+      version:
+        description: 'Git ref to build (tag recommended for releases, e.g. v0.1.0)'
+        required: true
+        type: string
+      # The literal 'Default' keeps the built-in matrix unchanged.
+      config:
+        description: 'Override configurations to build: key1:item1-1,item1-2;key2:item2-1,item2-2'
+        default: 'Default'
+        required: false
+        type: string
+      # The literal 'None' means no matrix exclusions are added.
+      exclude:
+        description: 'Exclude build configurations: key1-1:item1-1,key1-2:item1-2;key2-1:item2-1,key2-2:item2-2'
+        default: 'None'
+        required: false
+        type: string
+  workflow_call:
+    inputs:
+      version:
+        description: 'Git ref to build'
+        required: true
+        type: string
+      config:
+        description: 'Configurations to build: key1:item1-1,item1-2;key2:item2-1,item2-2'
+        default: 'Default'
+        required: false
+        type: string
+      exclude:
+        description: 'Exclude build configurations: key1-1:item1-1,key1-2:item1-2;key2-1:item2-1,key2-2:item2-2'
+        default: 'None'
+        required: false
+        type: string
+permissions:
+  contents: write
+jobs:
+  # Computes the build matrix as compact JSON and exposes it as the `matrix`
+  # job output for build_wheels.
+  define_matrix:
+    name: Define Build Matrix
+    runs-on: ubuntu-latest
+    outputs:
+      matrix: ${{ steps.set-matrix.outputs.matrix }}
+    defaults:
+      run:
+        shell: pwsh
+    # The workflow inputs are handed to the script as environment variables.
+    env:
+      CONFIGIN: ${{ inputs.config }}
+      EXCLUDEIN: ${{ inputs.exclude }}
+    steps:
+      # Starts from the default os/pyver/cuda axes. Unless CONFIGIN is
+      # 'Default', each ';'-separated `key:item,item` entry replaces that axis.
+      # Unless EXCLUDEIN is 'None', each ';'-separated group of `key:value`
+      # pairs becomes one entry of the matrix `exclude` list.
+      - name: Define Job Output
+        id: set-matrix
+        run: |
+          $matrix = @{
+              'os' = @('ubuntu-22.04', 'windows-2022')
+              'pyver' = @("3.11")
+              'cuda' = @("12.4.1", "13.1.0")
+          }
+          if ($env:CONFIGIN -ne 'Default') {$env:CONFIGIN.split(';').foreach({$matrix[$_.split(':')[0]] = $_.split(':')[1].split(',')})}
+          if ($env:EXCLUDEIN -ne 'None') {
+              $exclusions = @()
+              $exclusions += $env:EXCLUDEIN.split(';').replace(':','=').replace(',',"`n") | ConvertFrom-StringData
+              $matrix['exclude'] = $exclusions
+          }
+          $matrixOut = ConvertTo-Json $matrix -Compress
+          Write-Output ('matrix=' + $matrixOut) >> $env:GITHUB_OUTPUT
+  # Builds one CUDA wheel per matrix combination (os x pyver x cuda) emitted by
+  # define_matrix and uploads it to the GitHub release for the requested version.
+  build_wheels:
+    name: ${{ matrix.os }} CUDA ${{ matrix.cuda }}
+    needs: define_matrix
+    runs-on: ${{ matrix.os }}
+    strategy:
+      matrix: ${{ fromJSON(needs.define_matrix.outputs.matrix) }}
+    defaults:
+      run:
+        shell: pwsh
+    # The matrix CUDA version is exposed to the scripts as CUDAVER.
+    env:
+      CUDAVER: ${{ matrix.cuda }}
+    steps:
+      # Linux runners only.
+      - name: Free Disk Space
+        uses: jlumbroso/free-disk-space@v1.3.1
+        if: runner.os == 'Linux'
+        with:
+          tool-cache: true
+          android: true
+          dotnet: true
+          haskell: true
+          large-packages: false
+          swap-storage: true
+      # Checks out the requested ref of the named repository, with submodules.
+      - uses: actions/checkout@v6
+        with:
+          repository: 'vladlearns/llama-cpp-bin'
+          ref: ${{ inputs.version }}
+          submodules: 'recursive'
+      # Compiler cache keyed per CUDA version and OS.
+      - name: ccache
+        uses: hendrikmuhs/ccache-action@v1.2.20
+        with:
+          key: cuda-${{ matrix.cuda }}-${{ matrix.os }}
+          variant: ccache
+          evict-old-files: 14d
+      - uses: actions/setup-python@v6
+        with:
+          python-version: ${{ matrix.pyver }}
+      - name: Install CUDA Toolkit
+        uses: Jimver/cuda-toolkit@v0.2.30
+        id: cuda-toolkit
+        with:
+          cuda: ${{ matrix.cuda }}
+          method: 'network'
+      # Persists CUDA_PATH and CUDA_HOME for later steps via GITHUB_ENV; on
+      # Linux the toolkit's lib64 directory is prepended to LD_LIBRARY_PATH.
+      - name: Setup CUDA Environment
+        run: |
+          echo "CUDA_PATH=$env:CUDA_PATH" >> $env:GITHUB_ENV
+          echo "CUDA_HOME=$env:CUDA_PATH" >> $env:GITHUB_ENV
+          if ($IsLinux) {
+            echo "LD_LIBRARY_PATH=$env:CUDA_PATH/lib64:$env:LD_LIBRARY_PATH" >> $env:GITHUB_ENV
+          }
+      - name: Verify CUDA
+        run: nvcc --version
+      # Windows only: install Ninja and set up the MSVC environment.
+      - name: Install Ninja
+        if: runner.os == 'Windows'
+        run: choco install ninja
+      - name: Setup MSVC
+        if: runner.os == 'Windows'
+        uses: ilammy/msvc-dev-cmd@v1
+      # Linux installs its apt packages first; every OS installs `build`.
+      - name: Install Dependencies
+        run: |
+          if ($IsLinux) {
+            sudo apt-get update
+            sudo apt-get install -y build-essential libssl-dev
+          }
+          python -m pip install build
+      # The script drops the last component of CUDAVER and removes the dots to
+      # form the build tag (12.4.1 -> "+cu124"). Before building it copies the
+      # cudart, cublas and cublasLt libraries for the CUDA major version into
+      # src/llama_cpp_bin/bin; a library that cannot be found only produces a
+      # warning and the build continues.
+      - name: Build Wheel
+        run: |
+          $cudaVersion = $env:CUDAVER.Remove($env:CUDAVER.LastIndexOf('.')).Replace('.','')
+          $env:VERBOSE = '1'
+          $env:CMAKE_ARGS = '-DGGML_CUDA=on -DGGML_CUDA_CUB_3DOT2=on'
+          $env:CMAKE_ARGS = "-DCMAKE_BUILD_TYPE=Release -DGGML_NATIVE=off -DGGML_BACKEND_DL=on -DGGML_CPU_ALL_VARIANTS=on -DGGML_RPC=on -DLLAMA_BUILD_TESTS=off -DLLAMA_BUILD_EXAMPLES=off $env:CMAKE_ARGS"
+          if ($IsWindows) {
+            $env:CMAKE_ARGS += " -G 'Ninja' -DLLAMA_BUILD_BORINGSSL=ON"
+          }
+          $env:LLAMA_CPP_BUILD_JOBS = "2"
+          # Copy CUDA libraries
+          $binDir = "src/llama_cpp_bin/bin"
+          New-Item -ItemType Directory -Force -Path $binDir | Out-Null
+          $cudaMajor = $env:CUDAVER.Split('.')[0]
+          if ($IsLinux) {
+              $libsToFind = @("libcudart.so.$cudaMajor", "libcublas.so.$cudaMajor", "libcublasLt.so.$cudaMajor")
+              foreach ($lib in $libsToFind) {
+                  $foundFiles = Get-ChildItem -Path "$env:CUDA_PATH/lib64" -Filter "$lib*" -File | Select-Object -First 1
+                  if ($foundFiles) {
+                      bash -c "cp -L '$($foundFiles.FullName)' '$binDir/$lib'"
+                      Write-Host "Copied $($foundFiles.FullName) to $binDir/$lib"
+                  } else {
+                      Write-Warning "Could not find $lib"
+                  }
+              }
+          } else {
+              $libsToFind = @("cublas64_$cudaMajor.dll", "cudart64_$cudaMajor.dll", "cublasLt64_$cudaMajor.dll")
+              foreach ($lib in $libsToFind) {
+                  $foundFiles = Get-ChildItem -Path "$env:CUDA_PATH" -Filter $lib -Recurse -File | Select-Object -First 1
+                  if ($foundFiles) {
+                      Copy-Item -Path $foundFiles.FullName -Destination "$binDir/$lib"
+                      Write-Host "Copied $($foundFiles.FullName) to $binDir/$lib"
+                  } else {
+                      Write-Warning "Could not find $lib"
+                  }
+              }
+          }
+          $buildtag = "+cu$cudaVersion"
+          python -m build --wheel -C--build-option=egg_info "-C--build-option=--tag-build=$buildtag"
+      # continue-on-error keeps the job alive when the release upload fails so
+      # that the fallback artifact upload below can still run.
+      - name: Upload files to a GitHub release
+        id: upload-release
+        uses: svenstaro/upload-release-action@2.7.0
+        continue-on-error: true
+        with:
+          repo_token: ${{ secrets.GITHUB_TOKEN }}
+          file: ./dist/*.whl
+          tag: ${{ inputs.version }}
+          release_name: ${{ inputs.version }}
+          file_glob: true
+          make_latest: false
+          overwrite: true
+      # Fallback: keep the wheel as a workflow artifact only when the release
+      # upload step failed.
+      - uses: actions/upload-artifact@v6
+        if: steps.upload-release.outcome == 'failure'
+        with:
+          name: cuda-${{ matrix.cuda }}-${{ runner.os }}
+          path: ./dist/*.whl

llama_cpp_bin-9093.0.0/.github/workflows/build-wheels-macos.yml ADDED Viewed

@@ -0,0 +1,121 @@
+# Builds macOS wheels (one arm64 job, one x64 job). Can be started manually or
+# called from another workflow; the only input is the git ref to build.
+name: Build macOS Wheels
+on:
+  workflow_dispatch:
+    inputs:
+      version:
+        description: 'Git ref to build (tag recommended for releases, e.g. v0.1.0)'
+        required: true
+        type: string
+  workflow_call:
+    inputs:
+      version:
+        description: 'Git ref to build'
+        required: true
+        type: string
+permissions:
+  contents: write
+jobs:
+  # Builds the arm64 wheel with the Metal backend enabled and uploads it to the
+  # GitHub release for the requested version.
+  build_wheels_arm64:
+    name: macOS ARM64 (Metal)
+    runs-on: macos-14
+    steps:
+      # Checks out the requested ref of the named repository, with submodules.
+      - uses: actions/checkout@v6
+        with:
+          repository: 'vladlearns/llama-cpp-bin'
+          ref: ${{ inputs.version }}
+          submodules: 'recursive'
+      - uses: actions/setup-python@v6
+        with:
+          python-version: "3.11"
+      - name: Install Dependencies
+        run: |
+          python -m pip install build cmake
+      # Builds for arm64 only, then renames any wheel tagged `universal2` so
+      # its file name carries the arm64 platform tag instead.
+      - name: Build Wheel
+        run: |
+          export CMAKE_ARGS="-DCMAKE_BUILD_TYPE=Release -DGGML_NATIVE=off -DGGML_BACKEND_DL=on -DGGML_METAL=on -DGGML_METAL_USE_BF16=on -DGGML_METAL_EMBED_LIBRARY=on -DGGML_RPC=on -DLLAMA_BUILD_BORINGSSL=ON -DLLAMA_BUILD_TESTS=off -DLLAMA_BUILD_EXAMPLES=off"
+          export MACOSX_DEPLOYMENT_TARGET="13.3"
+          export CMAKE_OSX_ARCHITECTURES="arm64"
+          export ARCHFLAGS="-arch arm64"
+          VERBOSE=1 python -m build --wheel
+          for file in ./dist/*universal2.whl; do
+            # When nothing matches, bash leaves the pattern unexpanded; skip it
+            # so an already arch-tagged wheel does not fail the step on `mv`.
+            [ -e "$file" ] || continue
+            mv "$file" "${file/universal2/arm64}"
+          done
+      # continue-on-error keeps the job alive when the release upload fails so
+      # that the fallback artifact upload below can still run.
+      - name: Upload files to a GitHub release
+        id: upload-release
+        uses: svenstaro/upload-release-action@2.7.0
+        continue-on-error: true
+        with:
+          repo_token: ${{ secrets.GITHUB_TOKEN }}
+          file: ./dist/*.whl
+          tag: ${{ inputs.version }}
+          release_name: ${{ inputs.version }}
+          file_glob: true
+          make_latest: false
+          overwrite: true
+      # Fallback: keep the wheel as a workflow artifact only when the release
+      # upload step failed.
+      - uses: actions/upload-artifact@v6
+        if: steps.upload-release.outcome == 'failure'
+        with:
+          name: macos-arm64
+          path: ./dist/*.whl
+  # Builds the x86_64 wheel with Metal disabled and uploads it to the GitHub
+  # release for the requested version.
+  build_wheels_x64:
+    name: macOS x64
+    runs-on: macos-15-intel
+    steps:
+      # Checks out the requested ref of the named repository, with submodules.
+      - uses: actions/checkout@v6
+        with:
+          repository: 'vladlearns/llama-cpp-bin'
+          ref: ${{ inputs.version }}
+          submodules: 'recursive'
+      - uses: actions/setup-python@v6
+        with:
+          python-version: "3.11"
+      - name: Install Dependencies
+        run: |
+          python -m pip install build cmake
+      # Builds for x86_64 only, then renames any wheel tagged `universal2` so
+      # its file name carries the x86_64 platform tag instead.
+      - name: Build Wheel
+        run: |
+          export CMAKE_ARGS="-DCMAKE_BUILD_TYPE=Release -DGGML_NATIVE=off -DGGML_BACKEND_DL=on -DGGML_CPU_ALL_VARIANTS=on -DGGML_METAL=off -DGGML_RPC=on -DLLAMA_BUILD_BORINGSSL=ON -DLLAMA_BUILD_TESTS=off -DLLAMA_BUILD_EXAMPLES=off"
+          export MACOSX_DEPLOYMENT_TARGET="13.3"
+          export CMAKE_OSX_ARCHITECTURES="x86_64"
+          export ARCHFLAGS="-arch x86_64"
+          VERBOSE=1 python -m build --wheel
+          for file in ./dist/*universal2.whl; do
+            # When nothing matches, bash leaves the pattern unexpanded; skip it
+            # so an already arch-tagged wheel does not fail the step on `mv`.
+            [ -e "$file" ] || continue
+            mv "$file" "${file/universal2/x86_64}"
+          done
+      # continue-on-error keeps the job alive when the release upload fails so
+      # that the fallback artifact upload below can still run.
+      - name: Upload files to a GitHub release
+        id: upload-release
+        uses: svenstaro/upload-release-action@2.7.0
+        continue-on-error: true
+        with:
+          repo_token: ${{ secrets.GITHUB_TOKEN }}
+          file: ./dist/*.whl
+          tag: ${{ inputs.version }}
+          release_name: ${{ inputs.version }}
+          file_glob: true
+          make_latest: false
+          overwrite: true
+      # Fallback: keep the wheel as a workflow artifact only when the release
+      # upload step failed.
+      - uses: actions/upload-artifact@v6
+        if: steps.upload-release.outcome == 'failure'
+        with:
+          name: macos-x64
+          path: ./dist/*.whl