diff --git a/src/nanotron/trainer.py b/src/nanotron/trainer.py index 04d89cf4..62986fba 100644 --- a/src/nanotron/trainer.py +++ b/src/nanotron/trainer.py @@ -621,12 +621,12 @@ def train_step_logs( lr = self.lr_scheduler.get_last_lr()[0] log_entries = [ - # LogItem("consumed_samples", self.consumed_train_samples, "human_format"), # , "12d"), - # LogItem( - # "consumed_tokens", - # self.metadata.consumed_train_samples * self.config.tokens.sequence_length, - # "human_format", - # ), # , "12d"), + # LogItem("consumed_samples", self.metadata.consumed_train_samples, "human_format"), # , "12d"), + LogItem( + "consumed_tokens", + self.metadata.consumed_train_samples * self.config.tokens.sequence_length, + "human_format", + ), # , "12d"), LogItem("elapsed_time_per_iteration_ms", elapsed_time_per_iteration_ms, "human_format"), # , ".1f"), LogItem("tokens_per_sec", tokens_per_sec, "human_format"), # , "1.6E"), LogItem(