From 6092128125ad34f672f94e06f9b2b01722dacfc4 Mon Sep 17 00:00:00 2001
From: Jon Perry
Date: Fri, 26 Jul 2024 14:00:30 -0400
Subject: [PATCH] fix: vllm e2e dependencies and env_vars

---
 .github/workflows/e2e-vllm.yaml | 1 +
 packages/vllm/zarf.yaml         | 3 +++
 2 files changed, 4 insertions(+)

diff --git a/.github/workflows/e2e-vllm.yaml b/.github/workflows/e2e-vllm.yaml
index 3f95965f22..84f4ccd15e 100644
--- a/.github/workflows/e2e-vllm.yaml
+++ b/.github/workflows/e2e-vllm.yaml
@@ -69,6 +69,7 @@ jobs:
         run: |
           python -m pip install "."
           python -m pip install -U "huggingface_hub[cli,hf_transfer]"
+          python -m pip install confz
 
       - name: Setup UDS Environment
         uses: defenseunicorns/uds-common/.github/actions/setup@05f42bb3117b66ebef8c72ae050b34bce19385f5
diff --git a/packages/vllm/zarf.yaml b/packages/vllm/zarf.yaml
index 9a2e16a257..f86b2614cb 100644
--- a/packages/vllm/zarf.yaml
+++ b/packages/vllm/zarf.yaml
@@ -25,6 +25,7 @@ components:
           - "vllm-values.yaml"
     images:
       - ghcr.io/defenseunicorns/leapfrogai/vllm:###ZARF_PKG_TMPL_IMAGE_VERSION###
+      - cgr.dev/chainguard/bash:latest
     dataInjections:
       - source: .model/
         target:
@@ -41,3 +42,5 @@ components:
             env:
               - LAI_REPO_ID=TheBloke/Synthia-7B-v2.0-GPTQ
               - LAI_REVISION=gptq-4bit-32g-actorder_True
+              - LAI_QUANTIZATION=gptq
+              - LAI_HF_HUB_ENABLE_HF_TRANSFER=1