mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 05:04:58 +08:00
Improve _prune_hidden_states micro-benchmark (#707)
This commit is contained in:
parent
0080d8329d
commit
28873a2799
@ -100,7 +100,8 @@ def _prune_hidden_states(
|
||||
start_idx += prompt_len
|
||||
last_token_indicies.extend(
|
||||
range(start_idx, start_idx + input_metadata.num_generation_tokens))
|
||||
return hidden_states[last_token_indicies]
|
||||
return hidden_states.index_select(
|
||||
0, torch.tensor(last_token_indicies, device=hidden_states.device))
|
||||
|
||||
|
||||
def _get_penalties(
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user