MK0727
/

lambda-160m

Text Generation

Model card · Files and versions

MK0727 committed 4 days ago

Commit

f1635e5

·

verified ·

1 Parent(s): 134df9b

Upload lambda-160m pretrained model

Files changed (1) hide show

modeling_myllm.py +2 -1

modeling_myllm.py CHANGED Viewed

@@ -98,6 +98,7 @@ class MyLLMForCausalLM(PreTrainedModel, GenerationMixin):
     def forward(
         self,
         input_ids: torch.Tensor | None = None,
         labels: torch.Tensor | None = None,
         past_key_values: KeyValueCache | None = None,
         use_cache: bool | None = None,
@@ -108,7 +109,7 @@ class MyLLMForCausalLM(PreTrainedModel, GenerationMixin):
         # Accept the standard AutoModelForCausalLM argument names and
         # delegate the actual tensor computation to the PyTorch model.
         # ---------------------------------------------------------
-        del kwargs
         if input_ids is None:
             raise ValueError("input_ids is required")

     def forward(
         self,
         input_ids: torch.Tensor | None = None,
+        attention_mask: torch.Tensor | None = None,
         labels: torch.Tensor | None = None,
         past_key_values: KeyValueCache | None = None,
         use_cache: bool | None = None,
         # Accept the standard AutoModelForCausalLM argument names and
         # delegate the actual tensor computation to the PyTorch model.
         # ---------------------------------------------------------
+        del attention_mask, kwargs
         if input_ids is None:
             raise ValueError("input_ids is required")