Skip to content

Commit

Permalink
Support auto HSDP: default replica_dcn_axis_size to num_slices when it is set to -1
Browse files (browse the repository at this point in the history)
  • Loading branch information
blahBlahhhJ committed Nov 14, 2024
1 parent 433490e commit 3bcac0a
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions src/levanter/trainer.py
Original file line number Diff line number Diff line change
Expand Up @@ -766,6 +766,10 @@ def _validate_and_set_defaults(self):
if self.per_device_eval_parallelism == -1:
self.per_device_eval_parallelism = self.per_device_parallelism

if self.replica_dcn_axis_size == -1:
self.replica_dcn_axis_size = self.num_slices
logger.info(f"Setting replica_dcn_axis_size to {self.replica_dcn_axis_size}")


class AllConfig(Protocol):
trainer: TrainerConfig
Expand Down

0 comments on commit 3bcac0a

Please sign in to comment.