We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b5372e0 commit 48b2093Copy full SHA for 48b2093
lmdeploy/pytorch/engine/model_agent.py
@@ -403,6 +403,7 @@ def warmup(self):
403
is_decoding=False,
404
device='cuda',
405
vocab_size=self.model_config.vocab_size)
406
+ inputs.build_dp_meta()
407
self._forward_impl(inputs, swap_in_map=dict(), swap_out_map=dict())
408
409
# warmup decoding(with cuda graph)
@@ -413,6 +414,7 @@ def warmup(self):
413
414
is_decoding=True,
415
416
417
418
419
420
async def _async_model_forward(
0 commit comments