Skip to content

Commit

Permalink
use ray
Browse files Browse the repository at this point in the history
  • Loading branch information
IlyasMoutawwakil committed Sep 21, 2024
1 parent 192adfe commit 3f820de
Show file tree
Hide file tree
Showing 5 changed files with 4 additions and 8 deletions.
4 changes: 2 additions & 2 deletions .github/workflows/test_cli_cuda_vllm.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ jobs:
- name: Run tests
run: |
- pytest -x -s -k "cli and cuda and vllm and not tp"
+ FORCE_SERIAL=1 pytest -x -s -k "cli and cuda and vllm and not tp"
run_cli_cuda_vllm_multi_gpu_tests:
if: ${{
Expand Down Expand Up @@ -76,4 +76,4 @@ jobs:
- name: Run tests
run: |
- pytest -x -s -k "cli and cuda and vllm and tp"
+ FORCE_SERIAL=1 pytest -x -s -k "cli and cuda and vllm and tp"
3 changes: 0 additions & 3 deletions tests/configs/_memory_utilization_.yaml

This file was deleted.

3 changes: 2 additions & 1 deletion tests/configs/_tp_.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,8 @@ backend:
device_ids: 0,1
engine_args:
tensor_parallel_size: 2
- distributed_executor_backend: mp
+ disable_custom_all_reduce: true
+ distributed_executor_backend: ray

# hydra/cli specific settings
hydra:
Expand Down
1 change: 0 additions & 1 deletion tests/configs/cuda_inference_vllm_bloom.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,6 @@ defaults:
- _base_ # inherits from base config
- _cuda_ # inherits from cuda config
- _inference_ # inherits from inference config
- - _memory_utilization_ # inherits from memory utilization config (line removed by this commit)
- _serving_mode_ # inherits from serving_mode config
- _no_weights_ # inherits from no weights config
- _bloom_ # inherits from bloom config
Expand Down
1 change: 0 additions & 1 deletion tests/configs/cuda_inference_vllm_bloom_tp.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,6 @@ defaults:
- _base_ # inherits from base config
- _cuda_ # inherits from cuda config
- _inference_ # inherits from inference config
- - _memory_utilization_ # inherits from memory utilization config (line removed by this commit)
- _serving_mode_ # inherits from serving_mode config
- _no_weights_ # inherits from no weights config
- _bloom_ # inherits from bloom config
Expand Down

0 comments on commit 3f820de

Please sign in to comment.