Skip to content

Commit

Permalink
Merge pull request #14 from TianyiQ/main
Browse files: browse the repository at this point in the history
fix(evaluation): allow manual spec of tensor parallelization
  • Loading branch information
TianyiQ authored Nov 16, 2024
2 parents a6a0448 + 2ee86f8 commit c283c3c
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions src/abstractions/backends.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -344,6 +344,10 @@ def vllm_process_batch(
min_gpus_per_instance = (
2 if model_size <= 30 else 4 if model_size <= 80 else 8
)

if os.environ.get("FORCE_TP"):
min_gpus_per_instance = int(os.environ.get("FORCE_TP"))

assert num_gpus % min_gpus_per_instance == 0
args = [
"python",
Expand Down

0 comments on commit c283c3c

Please sign in to comment.