mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-04 18:21:52 +08:00
[None][feat] Nemotron H: Eagle3 support (#11131)
Signed-off-by: Izzy Putterman <iputterman@nvidia.com>
This commit is contained in:
parent
cd7762a2fa
commit
3ef8a4639b
@@ -361,6 +361,10 @@ class NemotronHLayer(DecoderLayer):
|
||||
spec_metadata=spec_metadata,
|
||||
**kwargs)
|
||||
hidden_states = torch.add(hidden_states, residual)
|
||||
if spec_metadata is not None and spec_metadata.is_layer_capture(
|
||||
self.layer_idx):
|
||||
spec_metadata.maybe_capture_hidden_states(self.layer_idx,
|
||||
hidden_states, None)
|
||||
|
||||
return hidden_states
|
||||
|
||||
|
||||
Loading…
Reference in New Issue
Block a user