Skip to content

Commit

Permalink
fix broken llama
Browse files Browse the repository at this point in the history
  • Loading branch information
Ubuntu committed Aug 30, 2024
1 parent 0666697 commit dbf5f67
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 79 deletions.
77 changes: 0 additions & 77 deletions tts_fish.py

This file was deleted.

4 changes: 2 additions & 2 deletions vllm/worker/model_runner.py
Original file line number Diff line number Diff line change
Expand Up @@ -480,7 +480,7 @@ def _compute_lens(self, inter_data: InterDataForSeqGroup, seq_idx: int,
inter_data.orig_seq_lens[seq_idx] = seq_len
inter_data.context_lens[seq_idx] = context_len

- if isinstance(tokens, list) and isinstance(tokens[0], list) == True:
+ if isinstance(tokens, list) or hasattr(self.runner.model_config.hf_config, "num_output_head"):
inter_data.input_tokens[seq_idx].extend(tokens)
else:
inter_data.input_tokens[seq_idx].append(tokens)
Expand Down Expand Up @@ -699,7 +699,7 @@ def build(self) -> ModelInputForGPU:

# Tokens and positions.
if cuda_graph_pad_size:
- if isinstance(input_tokens[0], list):
+ if hasattr(self.runner.model_config.hf_config, "num_output_head"):
num_head = len(input_tokens[0])
input_tokens.extend(itertools.repeat([0] * num_head, cuda_graph_pad_size))
else:
Expand Down

0 comments on commit dbf5f67

Please sign in to comment.