refactor: remove llama-cpp-bindings, extract supervisor.rs (#2151) #328
Workflow file for this run
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Build and release binaries. | |
on: | |
workflow_dispatch: | |
push: | |
tags: | |
- 'v*' | |
- 'nightly' | |
- '!*-dev' | |
pull_request: | |
branches: [ "main" ] | |
paths: | |
- '.github/workflows/release.yml' | |
concurrency: | |
group: ${{ github.workflow_ref }}-${{ github.head_ref || github.ref_name }} | |
# If this is enabled it will cancel current running and start latest | |
cancel-in-progress: true | |
env: | |
RUST_TOOLCHAIN: 1.76.0 | |
jobs: | |
release-llama-server-binary: | |
runs-on: ${{ matrix.os }} | |
container: ${{ matrix.container }} | |
strategy: | |
matrix: | |
binary: | |
- aarch64-apple-darwin | |
- x86_64-manylinux2014 | |
- x86_64-manylinux2014-cuda117 | |
- x86_64-manylinux2014-cuda122 | |
- x86_64-manylinux2014-vulkan | |
- x86_64-windows-msvc | |
- x86_64-windows-msvc-vulkan | |
- x86_64-windows-msvc-cuda117 | |
- x86_64-windows-msvc-cuda122 | |
include: | |
- os: macos-latest | |
target: aarch64-apple-darwin | |
binary: aarch64-apple-darwin | |
build_args: --features binary | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014 | |
container: quay.io/pypa/manylinux2014_x86_64 | |
build_args: --features binary | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014-cuda117 | |
container: sameli/manylinux2014_x86_64_cuda_11.7 | |
build_args: --features binary,cuda | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014-cuda122 | |
container: sameli/manylinux2014_x86_64_cuda_12.2 | |
build_args: --features binary,cuda | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014-vulkan | |
container: quay.io/pypa/manylinux2014_x86_64 | |
build_args: --features binary,vulkan | |
vulkan_sdk: '1.3.239.0' | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc | |
build_args: --features binary | |
ext: .exe | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc-vulkan | |
ext: .exe | |
build_args: --features vulkan,binary | |
vulkan_sdk: '1.3.280.0' | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc-cuda117 | |
ext: .exe | |
build_args: --features cuda,binary | |
windows_cuda: '11.7.1' | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc-cuda122 | |
ext: .exe | |
build_args: --features cuda,binary | |
windows_cuda: '12.2.0' | |
env: | |
SCCACHE_GHA_ENABLED: true | |
RUSTC_WRAPPER: sccache | |
CARGO_INCREMENTAL: 0 | |
steps: | |
- name: Checkout | |
uses: actions/checkout@v3 | |
with: | |
submodules: recursive | |
- name: Install Rust | |
uses: actions-rs/toolchain@v1 | |
with: | |
toolchain: ${{ env.RUST_TOOLCHAIN }} | |
target: ${{ matrix.target }} | |
components: clippy | |
- name: Set default rust version | |
run: rustup default ${{ env.RUST_TOOLCHAIN }} | |
- name: Sccache cache | |
uses: mozilla-actions/[email protected] | |
with: | |
version: "v0.4.0" | |
- name: Cargo registry cache | |
uses: actions/cache@v3 | |
with: | |
key: cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}-${{ github.sha }} | |
restore-keys: | | |
cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}- | |
cargo-${{ runner.os }}- | |
path: | | |
~/.cargo/registry | |
~/.cargo/git | |
- name: Prepare build environment for macOS & Linux | |
run: bash ./ci/prepare_build_environment.sh | |
if: runner.os != 'Windows' | |
- name: Prepare build environment for Windows | |
run: ./ci/prepare_build_environment.ps1 | |
if: runner.os == 'Windows' | |
- name: Install CUDA toolkit for Windows | |
uses: Jimver/[email protected] | |
with: | |
cuda: ${{ matrix.windows_cuda }} | |
method: 'network' | |
sub-packages: '["nvcc", "cudart", "cublas", "cublas_dev", "thrust", "visual_studio_integration"]' | |
if: runner.os == 'Windows' && matrix.windows_cuda != '' | |
- name: Install Vulkan SDK | |
uses: icycodes/[email protected] | |
with: | |
version: ${{ matrix.vulkan_sdk }} | |
cache: true | |
if: matrix.vulkan_sdk != '' | |
- name: Bulid release binary | |
run: cargo build ${{ matrix.build_args }} --release --target ${{ matrix.target }} --package llama-cpp-server | |
- name: Rename release binary | |
run: mv target/${{ matrix.target }}/release/llama-server${{ matrix.ext }} llama-server_${{ matrix.binary }}${{ matrix.ext }} | |
- name: Upload artifacts | |
uses: actions/upload-artifact@v3 | |
with: | |
retention-days: 3 | |
name: llama-server_${{ matrix.binary }}${{ matrix.ext }} | |
path: llama-server_${{ matrix.binary }}${{ matrix.ext }} | |
release-binary: | |
runs-on: ${{ matrix.os }} | |
container: ${{ matrix.container }} | |
strategy: | |
matrix: | |
binary: | |
- aarch64-apple-darwin | |
- x86_64-manylinux2014 | |
- x86_64-windows-msvc | |
include: | |
- os: macos-latest | |
target: aarch64-apple-darwin | |
binary: aarch64-apple-darwin | |
build_args: --no-default-features --features prod | |
- os: buildjet-2vcpu-ubuntu-2204 | |
target: x86_64-unknown-linux-gnu | |
binary: x86_64-manylinux2014 | |
container: quay.io/pypa/manylinux2014_x86_64 | |
build_args: --no-default-features --features static-ssl,prod | |
- os: windows-latest | |
target: x86_64-pc-windows-msvc | |
binary: x86_64-windows-msvc | |
build_args: --no-default-features --features prod | |
ext: .exe | |
env: | |
SCCACHE_GHA_ENABLED: true | |
RUSTC_WRAPPER: sccache | |
CARGO_INCREMENTAL: 0 | |
steps: | |
- name: Checkout | |
uses: actions/checkout@v3 | |
with: | |
submodules: recursive | |
- name: Install Rust | |
uses: actions-rs/toolchain@v1 | |
with: | |
toolchain: ${{ env.RUST_TOOLCHAIN }} | |
target: ${{ matrix.target }} | |
components: clippy | |
- name: Set default rust version | |
run: rustup default ${{ env.RUST_TOOLCHAIN }} | |
- name: Sccache cache | |
uses: mozilla-actions/[email protected] | |
with: | |
version: "v0.4.0" | |
- name: Cargo registry cache | |
uses: actions/cache@v3 | |
with: | |
key: cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}-${{ github.sha }} | |
restore-keys: | | |
cargo-${{ runner.os }}-${{ hashFiles('**/Cargo.toml') }}- | |
cargo-${{ runner.os }}- | |
path: | | |
~/.cargo/registry | |
~/.cargo/git | |
- name: Prepare build environment for macOS & Linux | |
run: bash ./ci/prepare_build_environment.sh | |
if: runner.os != 'Windows' | |
- name: Prepare build environment for Windows | |
run: ./ci/prepare_build_environment.ps1 | |
if: runner.os == 'Windows' | |
- name: Bulid release binary | |
run: cargo build ${{ matrix.build_args }} --release --target ${{ matrix.target }} --package tabby | |
- name: Rename release binary | |
run: mv target/${{ matrix.target }}/release/tabby${{ matrix.ext }} tabby_${{ matrix.binary }}${{ matrix.ext }} | |
- name: Upload artifacts | |
uses: actions/upload-artifact@v3 | |
with: | |
retention-days: 3 | |
name: tabby_${{ matrix.binary }}${{ matrix.ext }} | |
path: tabby_${{ matrix.binary }}${{ matrix.ext }} | |
pre-release: | |
needs: [release-llama-server-binary, release-binary] | |
runs-on: ubuntu-latest | |
permissions: | |
contents: write | |
steps: | |
- name: Download all artifacts | |
uses: actions/download-artifact@v3 | |
- name: Display structure of downloaded files | |
run: ls -R | |
- name: Creating distribution bundles | |
run: > | |
for llama_server in llama-server_*/llama-server_*; do | |
for tabby in tabby_*/tabby_*; do | |
llamab=$(basename $llama_server) | |
tabbyb=$(basename $tabby) | |
llaman=${llamab%.*} | |
tabbyn=${tabbyb%.*} | |
llamav=${llaman#llama-server_} | |
tabbyv=${tabbyn#tabby_} | |
if [[ $llamav == *"$tabbyv"* ]]; then | |
echo "Creating bundle for $llamav" | |
distdir=dist/tabby_$llamav | |
mkdir -p $distdir | |
cp $llama_server $distdir/llama-server | |
cp $tabby $distdir/tabby | |
zip -r $distdir.zip $distdir | |
rm -rf $distdir | |
fi | |
done | |
done | |
- uses: ncipollo/release-action@v1 | |
if: github.event_name == 'push' | |
with: | |
allowUpdates: true | |
prerelease: true | |
artifacts: "dist/tabby_*.zip" | |
tag: ${{ github.ref_name }} | |
removeArtifacts: true |