mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-16 17:22:23 +08:00
refactor example - qwen3_reranker (#19847)
Signed-off-by: reidliu41 <reid201711@gmail.com> Co-authored-by: reidliu41 <reid201711@gmail.com>
This commit is contained in:
parent
53da4cd397
commit
26d34eb67e
@ -22,15 +22,19 @@ model_name = "Qwen/Qwen3-Reranker-0.6B"
|
|||||||
# If you want to load the official original version, the init parameters are
|
# If you want to load the official original version, the init parameters are
|
||||||
# as follows.
|
# as follows.
|
||||||
|
|
||||||
model = LLM(
|
|
||||||
model=model_name,
|
def get_model() -> LLM:
|
||||||
task="score",
|
"""Initializes and returns the LLM model for Qwen3-Reranker."""
|
||||||
hf_overrides={
|
return LLM(
|
||||||
"architectures": ["Qwen3ForSequenceClassification"],
|
model=model_name,
|
||||||
"classifier_from_token": ["no", "yes"],
|
task="score",
|
||||||
"is_original_qwen3_reranker": True,
|
hf_overrides={
|
||||||
},
|
"architectures": ["Qwen3ForSequenceClassification"],
|
||||||
)
|
"classifier_from_token": ["no", "yes"],
|
||||||
|
"is_original_qwen3_reranker": True,
|
||||||
|
},
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
# Why do we need hf_overrides for the official original version:
|
# Why do we need hf_overrides for the official original version:
|
||||||
# vllm converts it to Qwen3ForSequenceClassification when loaded for
|
# vllm converts it to Qwen3ForSequenceClassification when loaded for
|
||||||
@ -51,7 +55,8 @@ suffix = "<|im_end|>\n<|im_start|>assistant\n<think>\n\n</think>\n\n"
|
|||||||
query_template = "{prefix}<Instruct>: {instruction}\n<Query>: {query}\n"
|
query_template = "{prefix}<Instruct>: {instruction}\n<Query>: {query}\n"
|
||||||
document_template = "<Document>: {doc}{suffix}"
|
document_template = "<Document>: {doc}{suffix}"
|
||||||
|
|
||||||
if __name__ == "__main__":
|
|
||||||
|
def main() -> None:
|
||||||
instruction = (
|
instruction = (
|
||||||
"Given a web search query, retrieve relevant passages that answer the query"
|
"Given a web search query, retrieve relevant passages that answer the query"
|
||||||
)
|
)
|
||||||
@ -72,6 +77,13 @@ if __name__ == "__main__":
|
|||||||
]
|
]
|
||||||
documents = [document_template.format(doc=doc, suffix=suffix) for doc in documents]
|
documents = [document_template.format(doc=doc, suffix=suffix) for doc in documents]
|
||||||
|
|
||||||
|
model = get_model()
|
||||||
outputs = model.score(queries, documents)
|
outputs = model.score(queries, documents)
|
||||||
|
|
||||||
|
print("-" * 30)
|
||||||
print([output.outputs.score for output in outputs])
|
print([output.outputs.score for output in outputs])
|
||||||
|
print("-" * 30)
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
main()
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user