mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-04 10:09:09 +08:00
[Doc] Correct beam_search usage in generative_models.md (#14363)
This commit is contained in:
parent
0ddc991f5c
commit
4f27044aab
@ -54,14 +54,16 @@ The {class}`~vllm.LLM.beam_search` method implements [beam search](https://huggi
|
|||||||
For example, to search using 5 beams and output at most 50 tokens:
|
For example, to search using 5 beams and output at most 50 tokens:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
|
from vllm import LLM
|
||||||
|
from vllm.sampling_params import BeamSearchParams
|
||||||
|
|
||||||
llm = LLM(model="facebook/opt-125m")
|
llm = LLM(model="facebook/opt-125m")
|
||||||
params = BeamSearchParams(beam_width=5, max_tokens=50)
|
params = BeamSearchParams(beam_width=5, max_tokens=50)
|
||||||
outputs = llm.generate("Hello, my name is", params)
|
outputs = llm.beam_search([{"prompt": "Hello, my name is "}], params)
|
||||||
|
|
||||||
for output in outputs:
|
for output in outputs:
|
||||||
prompt = output.prompt
|
generated_text = output.sequences[0].text
|
||||||
generated_text = output.outputs[0].text
|
print(f"Generated text: {generated_text!r}")
|
||||||
print(f"Prompt: {prompt!r}, Generated text: {generated_text!r}")
|
|
||||||
```
|
```
|
||||||
|
|
||||||
### `LLM.chat`
|
### `LLM.chat`
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user