We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4045ba8 commit bbb0774Copy full SHA for bbb0774
lmdeploy/pytorch/engine/model_agent.py
@@ -401,6 +401,7 @@ def warmup(self):
401
is_decoding=False,
402
device='cuda',
403
vocab_size=self.model_config.vocab_size)
404
+ inputs.build_dp_meta()
405
self._forward_impl(inputs)
406
407
# warmup decoding(with cuda graph)
@@ -411,6 +412,7 @@ def warmup(self):
411
412
is_decoding=True,
413
414
415
416
417
418
def _slice_outs(self, inputs: torch.Tensor, seq_length: torch.LongTensor):
0 commit comments