mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-27 17:17:06 +08:00
Remove tpu_int8 as it is related to deleted quantization config and implementation
Signed-off-by: Wei-Yu Lin <weiyulin@google.com>
This commit is contained in:
parent
49bef08e13
commit
df62da8da2
@@ -11,7 +11,6 @@ logger = init_logger(__name__)
|
|||||||
QuantizationMethods = Literal[
|
QuantizationMethods = Literal[
|
||||||
"awq",
|
"awq",
|
||||||
"deepspeedfp",
|
"deepspeedfp",
|
||||||
"tpu_int8",
|
|
||||||
"fp8",
|
"fp8",
|
||||||
"ptpc_fp8",
|
"ptpc_fp8",
|
||||||
"fbgemm_fp8",
|
"fbgemm_fp8",
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user