Skip to content

Commit

Permalink
Added checkpointing fields
Browse files Browse the repository at this point in the history
  • Loading branch information
karajendran committed Sep 19, 2024
1 parent 2853bf9 commit cb52fdc
Showing 1 changed file with 9 additions and 1 deletion.
Original file line number Diff line number Diff line change
Expand Up @@ -252,8 +252,14 @@ def get_current_node_id_and_rank():
# Saves memory and speeds up training considerably
group_by_length = True

# Checkpoint save strategy
save_strategy = "steps"

# Save a checkpoint every X update steps
save_steps = 0
save_steps = 1

# Maximum number of checkpoints to keep
save_total_limit = 5

# Log every X update steps
logging_steps = 50
Expand Down Expand Up @@ -324,7 +330,9 @@ def get_current_node_id_and_rank():
output_dir=save_model_path,
packing=packing,
per_device_train_batch_size=per_device_train_batch_size,
save_strategy=save_strategy,
save_steps=save_steps,
save_total_limit=save_total_limit,
warmup_ratio=warmup_ratio,
weight_decay=weight_decay,
)
Expand Down

0 comments on commit cb52fdc

Please sign in to comment.