ci: split llama-server and tabby release (#2116) #320
Workflow file for this run
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Build and release binaries. | |
on: | |
workflow_dispatch: | |
push: | |
tags: | |
- 'v*' | |
- 'nightly' | |
- '!*-dev' | |
pull_request: | |
branches: [ "main" ] | |
paths: | |
- '.github/workflows/release.yml' | |
concurrency: | |
group: ${{ github.workflow_ref }}-${{ github.head_ref || github.ref_name }} | |
# If this is enabled it will cancel current running and start latest | |
cancel-in-progress: true | |
env: | |
RUST_TOOLCHAIN: 1.76.0 | |
jobs: | |
release-llama-server-binary: | |
runs-on: ${{ matrix.os }} | |
container: ${{ matrix.container }} | |
strategy: | |
matrix: | |
binary: | |
- aarch64-apple-darwin | |
- x86_64-manylinux2014 | |
- x86_64-manylinux2014-cuda117 | |
- x86_64-manylinux2014-cuda122 | |
- x86_64-manylinux2014-vulkan | |
- x86_64-windows-msvc | |
- x86_64-windows-msvc-vulkan | |
- x86_64-windows-msvc-cuda117 | |
- x86_64-windows-msvc-cuda122 | |
include: | |
- os: macos-latest | |
target: aarch64-apple-darwin | |
binary: aarch64-apple-darwin | |
build_args: --features binary | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014 | |
container: quay.io/pypa/manylinux2014_x86_64 | |
build_args: --features binary | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014-cuda117 | |
container: sameli/manylinux2014_x86_64_cuda_11.7 | |
build_args: --features binary,cuda | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014-cuda122 | |
container: sameli/manylinux2014_x86_64_cuda_12.2 | |
build_args: --features binary,cuda | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014-vulkan | |
container: quay.io/pypa/manylinux2014_x86_64 | |
build_args: --features binary,vulkan | |
vulkan_sdk: '1.3.239.0' | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc | |
build_args: --features binary | |
ext: .exe | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc-vulkan | |
ext: .exe | |
build_args: --features vulkan,binary | |
vulkan_sdk: '1.3.280.0' | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc-cuda117 | |
ext: .exe | |
build_args: --features cuda,binary | |
windows_cuda: '11.7.1' | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc-cuda122 | |
ext: .exe | |
build_args: --features cuda,binary | |
windows_cuda: '12.2.0' | |
env: | |
SCCACHE_GHA_ENABLED: true | |
RUSTC_WRAPPER: sccache | |
CARGO_INCREMENTAL: 0 | |
steps: | |
- name: Checkout | |
uses: actions/checkout@v3 | |
with: | |
submodules: recursive | |
- name: Install Rust | |
uses: actions-rs/toolchain@v1 | |
with: | |
toolchain: ${{ env.RUST_TOOLCHAIN }} | |
target: ${{ matrix.target }} | |
components: clippy | |
- name: Set default rust version | |
run: rustup default ${{ env.RUST_TOOLCHAIN }} | |
- name: Sccache cache | |
uses: mozilla-actions/[email protected] | |
with: | |
version: "v0.4.0" | |
- name: Cargo registry cache | |
uses: actions/cache@v3 | |
with: | |
key: cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}-${{ github.sha }} | |
restore-keys: | | |
cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}- | |
cargo-${{ runner.os }}- | |
path: | | |
~/.cargo/registry | |
~/.cargo/git | |
- name: Prepare build environment for macOS & Linux | |
run: bash ./ci/prepare_build_environment.sh | |
if: runner.os != 'Windows' | |
- name: Prepare build environment for Windows | |
run: ./ci/prepare_build_environment.ps1 | |
if: runner.os == 'Windows' | |
- name: Install CUDA toolkit for Windows | |
uses: Jimver/[email protected] | |
with: | |
cuda: ${{ matrix.windows_cuda }} | |
method: 'network' | |
sub-packages: '["nvcc", "cudart", "cublas", "cublas_dev", "thrust", "visual_studio_integration"]' | |
if: runner.os == 'Windows' && matrix.windows_cuda != '' | |
- name: Install Vulkan SDK | |
uses: icycodes/[email protected] | |
with: | |
version: ${{ matrix.vulkan_sdk }} | |
cache: true | |
if: matrix.vulkan_sdk != '' | |
- name: Bulid release binary | |
run: cargo build ${{ matrix.build_args }} --release --target ${{ matrix.target }} --package llama-cpp-server | |
- name: Rename release binary | |
run: mv target/${{ matrix.target }}/release/llama-server${{ matrix.ext }} llama-server_${{ matrix.binary }}${{ matrix.ext }} | |
- name: Upload artifacts | |
uses: actions/upload-artifact@v3 | |
with: | |
retention-days: 3 | |
name: llama-server_${{ matrix.binary }}${{ matrix.ext }} | |
path: llama-server_${{ matrix.binary }}${{ matrix.ext }} | |
release-binary: | |
runs-on: ${{ matrix.os }} | |
container: ${{ matrix.container }} | |
strategy: | |
matrix: | |
binary: | |
- aarch64-apple-darwin | |
- x86_64-manylinux2014 | |
- x86_64-windows-msvc | |
include: | |
- os: macos-latest | |
target: aarch64-apple-darwin | |
binary: aarch64-apple-darwin | |
build_args: --no-default-features --features prod | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014 | |
container: quay.io/pypa/manylinux2014_x86_64 | |
build_args: --no-default-features --features static-ssl,prod | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc | |
build_args: --no-default-features --features prod | |
ext: .exe | |
env: | |
SCCACHE_GHA_ENABLED: true | |
RUSTC_WRAPPER: sccache | |
CARGO_INCREMENTAL: 0 | |
steps: | |
- name: Checkout | |
uses: actions/checkout@v3 | |
with: | |
submodules: recursive | |
- name: Install Rust | |
uses: actions-rs/toolchain@v1 | |
with: | |
toolchain: ${{ env.RUST_TOOLCHAIN }} | |
target: ${{ matrix.target }} | |
components: clippy | |
- name: Set default rust version | |
run: rustup default ${{ env.RUST_TOOLCHAIN }} | |
- name: Sccache cache | |
uses: mozilla-actions/[email protected] | |
with: | |
version: "v0.4.0" | |
- name: Cargo registry cache | |
uses: actions/cache@v3 | |
with: | |
key: cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}-${{ github.sha }} | |
restore-keys: | | |
cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}- | |
cargo-${{ runner.os }}- | |
path: | | |
~/.cargo/registry | |
~/.cargo/git | |
- name: Prepare build environment for macOS & Linux | |
run: bash ./ci/prepare_build_environment.sh | |
if: runner.os != 'Windows' | |
- name: Prepare build environment for Windows | |
run: ./ci/prepare_build_environment.ps1 | |
if: runner.os == 'Windows' | |
- name: Bulid release binary | |
run: cargo build ${{ matrix.build_args }} --release --target ${{ matrix.target }} --package tabby | |
- name: Rename release binary | |
run: mv target/${{ matrix.target }}/release/tabby${{ matrix.ext }} tabby_${{ matrix.binary }}${{ matrix.ext }} | |
- name: Upload artifacts | |
uses: actions/upload-artifact@v3 | |
with: | |
retention-days: 3 | |
name: tabby_${{ matrix.binary }}${{ matrix.ext }} | |
path: tabby_${{ matrix.binary }}${{ matrix.ext }} | |
pre-release: | |
if: github.event_name == 'push' | |
needs: [release-llama-server-binary, release-binary] | |
runs-on: ubuntu-latest | |
permissions: | |
contents: write | |
steps: | |
- name: Download all artifacts | |
uses: actions/download-artifact@v3 | |
- uses: ncipollo/release-action@v1 | |
with: | |
allowUpdates: true | |
prerelease: true | |
artifacts: "tabby_*/tabby_*,llama-server_*/llama-server_*" | |
tag: ${{ github.ref_name }} | |
removeArtifacts: true |