diff --git a/src/levanter/main/train_lm.py b/src/levanter/main/train_lm.py index 3fb1c6afa..a827ae46b 100644 --- a/src/levanter/main/train_lm.py +++ b/src/levanter/main/train_lm.py @@ -170,7 +170,7 @@ def main(config: TrainLmConfig): every=config.hf_save_steps, ) - trainer.add_hook(callbacks.GradWatchCallback(include_histogram=True), every=5) + # trainer.add_hook(callbacks.GradWatchCallback(include_histogram=True), every=5) state = trainer.initial_state(training_key, model_init=lambda: config.model.build(Vocab, key=model_key))