Upload files with `vila-upload`.
Browse files: modeling_vila.py (+2 -3)
modeling_vila.py
CHANGED
@@ -350,7 +350,7 @@ class VILAPretrainedModel(PreTrainedModel):
|
|
350 |
os.symlink(full_file_name, os.path.join(output_dir, file_name))
|
351 |
print("[HF remote code] linking", full_file_name, "to", output_dir)
|
352 |
|
353 |
-
def save_pretrained(self, output_dir, state_dict=None):
|
354 |
if state_dict is None:
|
355 |
# otherwise fetch from deepspeed
|
356 |
# state_dict = accelerator.get_state_dict(is_deepspeed_enabled)
|
@@ -590,12 +590,11 @@ class VILAForCasualLM(VILAPretrainedModel):
|
|
590 |
|
591 |
def train(self, mode: bool = True):
|
592 |
if mode:
|
593 |
-
print(f"Set padding side to right for training, {mode=}")
|
594 |
self.tokenizer.padding_side = "right"
|
595 |
else:
|
596 |
-
print(f"Set padding side to left for evaluation, {mode=}")
|
597 |
self.tokenizer.padding_side = "left"
|
598 |
super().train(mode)
|
|
|
599 |
|
600 |
def _embed(
|
601 |
self,
|
|
|
350 |
os.symlink(full_file_name, os.path.join(output_dir, file_name))
|
351 |
print("[HF remote code] linking", full_file_name, "to", output_dir)
|
352 |
|
353 |
+
def save_pretrained(self, output_dir, state_dict=None, **kwargs):
|
354 |
if state_dict is None:
|
355 |
# otherwise fetch from deepspeed
|
356 |
# state_dict = accelerator.get_state_dict(is_deepspeed_enabled)
|
|
|
590 |
|
591 |
def train(self, mode: bool = True):
|
592 |
if mode:
|
|
|
593 |
self.tokenizer.padding_side = "right"
|
594 |
else:
|
|
|
595 |
self.tokenizer.padding_side = "left"
|
596 |
super().train(mode)
|
597 |
+
return self
|
598 |
|
599 |
def _embed(
|
600 |
self,
|