You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
logger.info(f"Attempted to get dimensions: num_layers={num_layers}, d_model={d_model}")
53
80
if num_layers is None or d_model is None:
54
81
logger.warning(
55
82
f"Could not automatically determine num_layers or d_model for {model_name}. "
@@ -86,7 +113,7 @@ def parse_args():
86
113
"--output-dir",
87
114
type=str,
88
115
default=f"clt_train_{int(time.time())}",
89
-
help="Directory to save logs, checkpoints, and final model. If resuming, this might be overridden by --resume-from-checkpoint-dir.",
116
+
help="Directory to save logs, checkpoints, and final model. If resuming, this might be overridden by --resume_from_checkpoint_dir.",
90
117
)
91
118
core_group.add_argument(
92
119
"--model-name",
@@ -106,16 +133,16 @@ def parse_args():
106
133
help="Enable distributed training (requires torchrun/appropriate launcher).",
107
134
)
108
135
core_group.add_argument(
109
-
"--resume-from-checkpoint-dir",
136
+
"--resume_from_checkpoint_dir",
110
137
type=str,
111
138
default=None,
112
-
help="Path to the output directory of a previous run to resume from. Will attempt to load 'latest' or a specific step if --resume-step is also given.",
139
+
help="Path to the output directory of a previous run to resume from. Will attempt to load 'latest' or a specific step if --resume_step is also given.",
113
140
)
114
141
core_group.add_argument(
115
-
"--resume-step",
142
+
"--resume_step",
116
143
type=int,
117
144
default=None,
118
-
help="Optional specific step to resume from. Used in conjunction with --resume-from-checkpoint-dir.",
145
+
help="Optional specific step to resume from. Used in conjunction with --resume_from_checkpoint_dir.",
0 commit comments