@@ -113,8 +113,7 @@ class LagLlamaLightningModule(LightningModule):
defforward(self,*args,**kwargs):
"""
Self-speculative decoding for continuous distributions, where the model predicts
distribution parameters for multiple future steps.
Multi-step ancestral sampling: for each time step, predict the next n_predictions - 1 steps, and then continue for time step n_predictions until prediction_length is reached.