Drop the job-level `container:` block (image + options) from the TGI
integration workflow and stop attaching the `tgi-tests-gpt2` container to
the `test-network` Docker network.

NOTE(review): this patch was recovered from a copy whose newlines had been
collapsed. Line boundaries follow the hunk headers' line counts; the leading
indentation of context/removed lines is assumed from the usual GitHub Actions
job/step layout -- confirm against the target file before applying.

diff --git a/.github/workflows/test-pytorch-xla-tpu-tgi-integration.yml b/.github/workflows/test-pytorch-xla-tpu-tgi-integration.yml
index af30bc36..b4a99c07 100644
--- a/.github/workflows/test-pytorch-xla-tpu-tgi-integration.yml
+++ b/.github/workflows/test-pytorch-xla-tpu-tgi-integration.yml
@@ -18,10 +18,6 @@ jobs:
     runs-on:
       group: gcp-ct5lp-hightpu-8t
 
-    container:
-      image: us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla:r2.4.0_3.10_tpuvm
-      options: --shm-size "16gb" --ipc host --privileged ${{ vars.V5_LITEPOD_8_ENV}} --network test-network -v /mnt/hf_cache:/mnt/hf_cache -e PJRT_DEVICE=TPU
-
     env:
       PJRT_DEVICE: TPU
       HF_HUB_CACHE: /mnt/hf_cache/cache_huggingface
@@ -49,7 +45,6 @@ jobs:
         run: |
           # Start docker container in background
           docker run -d --name tgi-tests-gpt2 \
-            --network test-network \
             -e LOG_LEVEL=info,text_generation_router,text_generation_launcher=debug \
             -e HF_HUB_ENABLE_HF_TRANSFER=0 \
             -e MAX_BATCH_SIZE=4 \