mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 01:05:01 +08:00
[Doc] Remove Useless Comments (#24687)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
127ded0a9e
commit
a892b259b4
@@ -757,10 +757,9 @@ class Fp8MoEMethod(FusedMoEMethodBase):
|
|||||||
layer.w2_weight = torch.nn.Parameter(shuffled_w2,
|
layer.w2_weight = torch.nn.Parameter(shuffled_w2,
|
||||||
requires_grad=False)
|
requires_grad=False)
|
||||||
|
|
||||||
# DeepGemm scales need to be transposed and aligned. We try to do
|
# DeepGemm scales need to be transposed and aligned. We try to do
|
||||||
# it ahead of time for performance reasons.
|
# it ahead of time for performance reasons.
|
||||||
if self.allow_deep_gemm and not is_deep_gemm_e8m0_used():
|
if self.allow_deep_gemm and not is_deep_gemm_e8m0_used():
|
||||||
# Lazy import to avoid CUDA initialization problems.
|
|
||||||
if _is_col_major(layer.w13_weight_scale_inv):
|
if _is_col_major(layer.w13_weight_scale_inv):
|
||||||
layer.w13_weight_scale_inv = \
|
layer.w13_weight_scale_inv = \
|
||||||
get_col_major_tma_aligned_tensor(layer.w13_weight_scale_inv).contiguous()
|
get_col_major_tma_aligned_tensor(layer.w13_weight_scale_inv).contiguous()
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user