lirannoc committed on
Commit
868b7c0
·
verified ·
1 Parent(s): 628d649

Update modeling_super_linear.py

Browse files
Files changed (1) hide show
  1. modeling_super_linear.py +2 -3
modeling_super_linear.py CHANGED
@@ -561,7 +561,6 @@ class SuperLinearForCausalLM(PreTrainedModel, GenerationMixin):
561
 
562
  def forward(self,
563
  inputs_embeds: torch.Tensor = None,
564
- prediction_len: int = None,
565
  attention_mask: Optional[torch.Tensor] = None,
566
  past_key_values: Optional[Tuple] = None,
567
  use_cache: bool = True,
@@ -577,11 +576,11 @@ class SuperLinearForCausalLM(PreTrainedModel, GenerationMixin):
577
  return CausalLMOutputWithCrossAttentions(loss=None,logits=preds,past_key_values=None,hidden_states=None,attentions=None,)
578
 
579
 
580
- def prepare_inputs_for_generation(self, inputs_embeds, past_key_values=None, prediction_len=None, **kwargs):
581
  if past_key_values is not None:
582
  # only feed the last new step
583
  inputs_embeds = inputs_embeds[:, -1:, :]
584
- return {"inputs_embeds": inputs_embeds, "past_key_values": past_key_values, "prediction_len": prediction_len}
585
 
586
  def _reorder_cache(self, past, beam_idx, **kwargs):
587
  return past # backbone keeps no KV cache
 
561
 
562
  def forward(self,
563
  inputs_embeds: torch.Tensor = None,
 
564
  attention_mask: Optional[torch.Tensor] = None,
565
  past_key_values: Optional[Tuple] = None,
566
  use_cache: bool = True,
 
576
  return CausalLMOutputWithCrossAttentions(loss=None,logits=preds,past_key_values=None,hidden_states=None,attentions=None,)
577
 
578
 
579
+ def prepare_inputs_for_generation(self, inputs_embeds, past_key_values=None, **kwargs):
580
  if past_key_values is not None:
581
  # only feed the last new step
582
  inputs_embeds = inputs_embeds[:, -1:, :]
583
+ return {"inputs_embeds": inputs_embeds, "past_key_values": past_key_values}
584
 
585
  def _reorder_cache(self, past, beam_idx, **kwargs):
586
  return past # backbone keeps no KV cache