-
Notifications
You must be signed in to change notification settings - Fork 24
43 lines (39 loc) · 1.62 KB
/
test-pytorch-xla-tpu-tgi.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
# Workflow display name.
name: Optimum TPU / Test TGI on TPU

# Runs only on pushes to the `testcipauline` branch. The path filter and the
# pull_request trigger are kept below, commented out (disabled).
on:
  push:
    branches:
      - testcipauline
    # paths:
    #   - "text-generation-inference/**"
  # pull_request:
  #   branches: [ main ]
  #   paths:
  #     - "text-generation-inference/**"
# Runs are grouped by workflow name plus `github.head_ref`, falling back to
# `github.run_id` when `head_ref` is empty. A new run in the same group
# cancels the one still in progress.
concurrency:
  group: '${{ github.workflow }}-${{ github.head_ref || github.run_id }}'
  cancel-in-progress: true
jobs:
  do-the-job:
    name: Run TGI tests
    runs-on: tpu-runner-solo
    # The container configuration is currently disabled, so steps run
    # directly on the runner.
    # container:
    #   # Use an image that works with TPU with Pytorch 2.3.0 (release was not working)
    #   image: us-central1-docker.pkg.dev/tpu-pytorch-releases/docker/xla@sha256:8f1dcd5b03f993e4da5c20d17c77aff6a5f22d5455f8eb042d2e4b16ac460526
    #   options: --shm-size "16gb" --ipc host --privileged
    env:
      PJRT_DEVICE: TPU
    steps:
      # - name: Checkout
      #   uses: actions/checkout@v4
      - name: Install JAX and check TPU availability
        # `python -m pip` is used so packages land in the same interpreter
        # that runs the import checks below; pip is upgraded before the
        # install so the upgraded pip is the one doing the install.
        # NOTE(review): torch_xla is not installed by any enabled step, so
        # the last check presumably relies on it being preinstalled on the
        # runner -- confirm.
        run: |
          python -m pip install --upgrade pip
          python -m pip install 'jax[tpu]' -f https://storage.googleapis.com/jax-releases/libtpu_releases.html
          python -c 'import jax; print("TPU cores:", jax.device_count())'
          python -c "import torch_xla.core.xla_model as xm; assert xm.xla_device().type == 'xla', 'XLA device not available'"
      # - name: Install dependencies
      #   run: pip install torch~=2.2.0 torch_xla[tpu]~=2.2.0 -f https://storage.googleapis.com/libtpu-releases/index.html
      # - name: Checking Pytorch/XLA installation
      #   run: python -c "import torch_xla.core.xla_model as xm; assert xm.xla_device().type == 'xla', 'XLA device not available'"
      # - name: Build and test TGI server
      #   run: |
      #     HF_TOKEN=${{ secrets.HF_TOKEN_OPTIMUM_TPU_CI }} make tgi_test