Update modeling_phi3.py
Browse files — modeling_phi3.py (+1 −2)
modeling_phi3.py
CHANGED
|
@@ -35,7 +35,6 @@ from transformers.modeling_rope_utils import ROPE_INIT_FUNCTIONS
|
|
| 35 |
from transformers.modeling_utils import ALL_ATTENTION_FUNCTIONS, PreTrainedModel
|
| 36 |
from transformers.processing_utils import Unpack
|
| 37 |
from transformers.utils import (
|
| 38 |
-
LossKwargs,
|
| 39 |
add_code_sample_docstrings,
|
| 40 |
add_start_docstrings,
|
| 41 |
add_start_docstrings_to_model_forward,
|
|
@@ -817,7 +816,7 @@ class Phi3Model(Phi3PreTrainedModel):
|
|
| 817 |
return causal_mask
|
| 818 |
|
| 819 |
|
| 820 |
-
class KwargsForCausalLM(FlashAttentionKwargs, LossKwargs): ...
|
| 821 |
|
| 822 |
|
| 823 |
class Phi3ForCausalLM(Phi3PreTrainedModel, GenerationMixin):
|
|
|
|
| 35 |
from transformers.modeling_utils import ALL_ATTENTION_FUNCTIONS, PreTrainedModel
|
| 36 |
from transformers.processing_utils import Unpack
|
| 37 |
from transformers.utils import (
|
|
|
|
| 38 |
add_code_sample_docstrings,
|
| 39 |
add_start_docstrings,
|
| 40 |
add_start_docstrings_to_model_forward,
|
|
|
|
| 816 |
return causal_mask
|
| 817 |
|
| 818 |
|
| 819 |
+
class KwargsForCausalLM(FlashAttentionKwargs): ...
|
| 820 |
|
| 821 |
|
| 822 |
class Phi3ForCausalLM(Phi3PreTrainedModel, GenerationMixin):
|