[compile] Recompile graph module during Dynamo cache loading. (#30743)

Signed-off-by: Zhengxu Chen <zhxchen17@fb.com>
This commit is contained in:
Zhengxu Chen 2025-12-17 05:00:12 -05:00 committed by GitHub
parent 7b966ae2ba
commit 53cd7f868b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -104,6 +104,7 @@ class VllmSerializableFunction(SerializableCallable):
state = pickle.loads(data)
fake_mode = FakeTensorMode(shape_env=ShapeEnv())
state["graph_module"] = GraphPickler.loads(state["graph_module"], fake_mode)
state["graph_module"].recompile()
state["example_inputs"] = GraphPickler.loads(state["example_inputs"], fake_mode)
vllm_backend = VllmBackend(get_current_vllm_config(), state["prefix"])