mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 12:35:51 +08:00
[Bugfix] Flush TunableOp results before worker processes are destroyed. (#13623)
Signed-off-by: Nichols A. Romero <nick.romero@amd.com>
This commit is contained in:
parent
75e9d49796
commit
fa82074167
@ -250,6 +250,15 @@ def _run_worker_process(
|
|||||||
except Exception:
|
except Exception:
|
||||||
logger.exception("Worker failed")
|
logger.exception("Worker failed")
|
||||||
|
|
||||||
|
# Flush TunableOp results when TunableOp is enabled and
|
||||||
|
# online (in situ) tuning is enabled.
|
||||||
|
# The offline tuning API (record_untuned_is_enabled()) is only
|
||||||
|
# available in PyTorch 2.6 or later.
|
||||||
|
import torch.cuda.tunable as tunable
|
||||||
|
if (tunable.is_enabled() and tunable.tuning_is_enabled()
|
||||||
|
and not tunable.record_untuned_is_enabled()):
|
||||||
|
tunable.write_file()
|
||||||
|
|
||||||
logger.info("Worker exiting")
|
logger.info("Worker exiting")
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user