Fix `GenerationMixin` ImportError on the transformers main branch (#6)

- Fix `GenerationMixin` ImportError on the transformers main branch (496bcc3aef55fd057ec943a122be78e0f6c423f3)

Files changed (2)

config.json (changed)

@@ -19,7 +19,8 @@
     "merge_kernel_size": [
       2,
       2
-    ]
   },
   "text_config": {
     "vocab_size": 163840,

     "merge_kernel_size": [
       2,
       2
+    ],
+    "torch_dtype": "bfloat16"
   },
   "text_config": {
     "vocab_size": 163840,

modeling_kimi_vl.py (changed)

@@ -55,10 +55,8 @@ import torch.distributed as dist
 from torch.nn import CrossEntropyLoss
 from transformers.activations import GELUActivation, ACT2FN, PytorchGELUTanh
 from transformers.cache_utils import Cache, DynamicCache
-from transformers.modeling_utils import (
-    PreTrainedModel,
-    GenerationMixin,
-)
 from transformers.models.llava.modeling_llava import LlavaCausalLMOutputWithPast
 from transformers.modeling_attn_mask_utils import _prepare_4d_causal_attention_mask
 from transformers.modeling_outputs import (

 from torch.nn import CrossEntropyLoss
 from transformers.activations import GELUActivation, ACT2FN, PytorchGELUTanh
 from transformers.cache_utils import Cache, DynamicCache
+from transformers.modeling_utils import PreTrainedModel
+from transformers.generation.utils import GenerationMixin
 from transformers.models.llava.modeling_llava import LlavaCausalLMOutputWithPast
 from transformers.modeling_attn_mask_utils import _prepare_4d_causal_attention_mask
 from transformers.modeling_outputs import (