Skip to content

Commit

Permalink
Merge branch 'inference' into broadcast_shapes
Browse files Browse the repository at this point in the history
  • Loading branch information
soumyac1999 authored Nov 3, 2023
2 parents 575cc2a + 1105f4e commit b37faaa
Show file tree
Hide file tree
Showing 34 changed files with 1,667 additions and 1,996 deletions.
75 changes: 75 additions & 0 deletions .github/workflows/helpers/prebuild_legion.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,75 @@
#! /usr/bin/env bash
set -euo pipefail

# Parse input params
python_version=${python_version:-"empty"}
gpu_backend=${gpu_backend:-"empty"}
gpu_backend_version=${gpu_backend_version:-"empty"}

if [[ "${gpu_backend}" != @(cuda|hip_cuda|hip_rocm|intel) ]]; then
echo "Error, value of gpu_backend (${gpu_backend}) is invalid. Pick between 'cuda', 'hip_cuda', 'hip_rocm' or 'intel'."
exit 1
else
echo "Pre-building Legion with GPU backend: ${gpu_backend}"
fi

if [[ "${gpu_backend}" == "cuda" || "${gpu_backend}" == "hip_cuda" ]]; then
# Check that CUDA version is supported. Versions above 12.0 not supported because we don't publish docker images for it yet.
if [[ "$gpu_backend_version" != @(11.1|11.2|11.3|11.4|11.5|11.6|11.7|11.8|12.0) ]]; then
echo "cuda_version is not supported, please choose among {11.1|11.2|11.3|11.4|11.5|11.6|11.7|11.8|12.0}"
exit 1
fi
export cuda_version="$gpu_backend_version"
elif [[ "${gpu_backend}" == "hip_rocm" ]]; then
# Check that HIP version is supported
if [[ "$gpu_backend_version" != @(5.3|5.4|5.5|5.6) ]]; then
echo "hip_version is not supported, please choose among {5.3, 5.4, 5.5, 5.6}"
exit 1
fi
export hip_version="$gpu_backend_version"
else
echo "gpu backend: ${gpu_backend} and gpu_backend_version: ${gpu_backend_version} not yet supported."
exit 1
fi

# Cd into directory holding this script
cd "${BASH_SOURCE[0]%/*}"

export FF_GPU_BACKEND="${gpu_backend}"
export FF_CUDA_ARCH=all
export FF_HIP_ARCH=all
export BUILD_LEGION_ONLY=ON
export INSTALL_DIR="/usr/legion"
export python_version="${python_version}"

# Build Docker Flexflow Container
echo "building docker"
../../../docker/build.sh flexflow

# Cleanup any existing container with the same name
docker rm prelegion || true

# Create container to be able to copy data from the image
docker create --name prelegion flexflow-"${gpu_backend}"-"${gpu_backend_version}":latest

# Copy legion libraries to host
echo "extract legion library assets"
mkdir -p ../../../prebuilt_legion_assets
rm -rf ../../../prebuilt_legion_assets/tmp || true
docker cp prelegion:$INSTALL_DIR ../../../prebuilt_legion_assets/tmp


# Create the tarball file
cd ../../../prebuilt_legion_assets/tmp
export LEGION_TARBALL="legion_ubuntu-20.04_${gpu_backend}-${gpu_backend_version}_py${python_version}.tar.gz"

echo "Creating archive $LEGION_TARBALL"
tar -zcvf "../$LEGION_TARBALL" ./
cd ..
echo "Checking the size of the Legion tarball..."
du -h "$LEGION_TARBALL"


# Cleanup
rm -rf tmp/*
docker rm prelegion
84 changes: 84 additions & 0 deletions .github/workflows/prebuild-legion.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,84 @@
name: "prebuild-legion"
on:
push:
branches:
- "inference"
paths:
- "cmake/**"
- "config/**"
- "deps/legion/**"
- ".github/workflows/helpers/install_dependencies.sh"
workflow_dispatch:
concurrency:
group: prebuild-legion-${{ github.head_ref || github.run_id }}
cancel-in-progress: true

jobs:
prebuild-legion:
name: Prebuild Legion with CMake
runs-on: ubuntu-20.04
defaults:
run:
shell: bash -l {0} # required to use an activated conda environment
strategy:
matrix:
gpu_backend: ["cuda", "hip_rocm"]
gpu_backend_version: ["11.8", "5.6"]
python_version: ["3.11"]
exclude:
- gpu_backend: "cuda"
gpu_backend_version: "5.6"
- gpu_backend: "hip_rocm"
gpu_backend_version: "11.8"
fail-fast: false
steps:
- name: Checkout Git Repository
uses: actions/checkout@v3
with:
submodules: recursive

- name: Free additional space on runner
run: .github/workflows/helpers/free_space_on_runner.sh

- name: Build Legion
env:
gpu_backend: ${{ matrix.gpu_backend }}
gpu_backend_version: ${{ matrix.gpu_backend_version }}
python_version: ${{ matrix.python_version }}
run: .github/workflows/helpers/prebuild_legion.sh

- name: Archive compiled Legion library (CUDA)
uses: actions/upload-artifact@v3
with:
name: legion_ubuntu-20.04_${{ matrix.gpu_backend }}-${{ matrix.gpu_backend_version }}_py${{ matrix.python_version }}
path: prebuilt_legion_assets/legion_ubuntu-20.04_${{ matrix.gpu_backend }}-${{ matrix.gpu_backend_version }}_py${{ matrix.python_version }}.tar.gz

create-release:
name: Create new release
runs-on: ubuntu-20.04
needs: prebuild-legion
steps:
- name: Checkout Git Repository
uses: actions/checkout@v3
- name: Free additional space on runner
run: .github/workflows/helpers/free_space_on_runner.sh
- name: Create folder for artifacts
run: mkdir artifacts unwrapped_artifacts
- name: Download artifacts
uses: actions/download-artifact@v3
with:
path: ./artifacts
- name: Display structure of downloaded files
working-directory: ./artifacts
run: ls -R
- name: Unwrap all artifacts
working-directory: ./artifacts
run: find . -maxdepth 2 -mindepth 2 -type f -name "*.tar.gz" -exec mv {} ../unwrapped_artifacts/ \;
- name: Get datetime
run: echo "RELEASE_DATETIME=$(date '+%Y-%m-%dT%H-%M-%S')" >> $GITHUB_ENV
- name: Release
env:
NAME: ${{ env.RELEASE_DATETIME }}
TAG_NAME: ${{ env.RELEASE_DATETIME }}
GITHUB_TOKEN: ${{ secrets.FLEXFLOW_TOKEN }}
run: gh release create $TAG_NAME ./unwrapped_artifacts/*.tar.gz --repo flexflow/flexflow-third-party
Loading

0 comments on commit b37faaa

Please sign in to comment.