Skip to content

Commit

Permalink
Update tuner.py
Browse files (browse the repository at this point in the history)
  • Loading branch information
hiyouga authored May 11, 2024
1 parent 1049b29 commit 13851fb
Showing 1 changed file with 12 additions and 8 deletions.
20 changes: 12 additions & 8 deletions src/llmtuner/train/tuner.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,9 +15,11 @@
from .rm import run_rm
from .sft import run_sft


if TYPE_CHECKING:
from transformers import TrainerCallback


logger = get_logger(__name__)


Expand Down Expand Up @@ -51,8 +53,8 @@ def export_model(args: Optional[Dict[str, Any]] = None) -> None:
raise ValueError("Please merge adapters before quantizing the model.")

tokenizer_module = load_tokenizer(model_args)
tokenizer = tokenizer_module['tokenizer']
processor = tokenizer_module['processor']
tokenizer = tokenizer_module["tokenizer"]
processor = tokenizer_module["processor"]
get_template_and_fix_tokenizer(tokenizer, data_args.template)
model = load_model(tokenizer, model_args, finetuning_args) # must after fixing tokenizer to resize vocab

Expand All @@ -63,7 +65,7 @@ def export_model(args: Optional[Dict[str, Any]] = None) -> None:
raise ValueError("The model is not a `PreTrainedModel`, export aborted.")

if getattr(model, "quantization_method", None) is None: # cannot convert dtype of a quantized model
output_dtype = getattr(model.config, "torch_dtype", torch.float16)
output_dtype = torch.float16
setattr(model.config, "torch_dtype", output_dtype)
model = model.to(output_dtype)

Expand All @@ -86,10 +88,12 @@ def export_model(args: Optional[Dict[str, Any]] = None) -> None:
tokenizer.save_pretrained(model_args.export_dir)
if model_args.export_hub_model_id is not None:
tokenizer.push_to_hub(model_args.export_hub_model_id, token=model_args.hf_hub_token)

if model_args.visual_inputs and processor is not None:
getattr(processor, "image_processor").save_pretrained(model_args.export_dir)
if model_args.export_hub_model_id is not None:
getattr(processor, "image_processor").push_to_hub(
model_args.export_hub_model_id, token=model_args.hf_hub_token
)
except Exception:
logger.warning("Cannot save tokenizer, please copy the files manually.")

if model_args.visual_inputs:
processor.image_processor.save_pretrained(model_args.export_dir)
if model_args.export_hub_model_id is not None:
processor.image_processor.push_to_hub(model_args.export_hub_model_id, token=model_args.hf_hub_token)

0 comments on commit 13851fb

Please sign in to comment.