File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -145,6 +145,7 @@ diffusion_scheduler_config: {
145 145 # Output directory
146 146 # Create a GCS bucket, e.g. my-maxtext-outputs, and set this to "gs://my-maxtext-outputs/"
147 147 base_output_directory: ""
148 + tensorboard_dir: ""
148 149
149 150 # Hardware
150 151 hardware: 'tpu' # Supported hardware types are 'tpu', 'gpu'
@@ -300,7 +301,7 @@ save_optimizer: False
300 301 adam_b1: 0.9 # Exponential decay rate to track the first moment of past gradients.
301 302 adam_b2: 0.999 # Exponential decay rate to track the second moment of past gradients.
302 303 adam_eps: 1.e-8 # A small constant applied to the denominator outside of the square root.
303 - adam_weight_decay: 0 # AdamW weight decay
304 + adam_weight_decay: 0.0 # AdamW weight decay
304 305 max_grad_norm: 1.0
305 306
306 307 enable_profiler: False
Original file line number Diff line number Diff line change @@ -122,6 +122,7 @@ diffusion_scheduler_config: {
122 122 # Output directory
123 123 # Create a GCS bucket, e.g. my-maxtext-outputs, and set this to "gs://my-maxtext-outputs/"
124 124 base_output_directory: ""
125 + tensorboard_dir: ""
125 126
126 127 # Hardware
127 128 hardware: 'tpu' # Supported hardware types are 'tpu', 'gpu'
@@ -256,7 +257,7 @@ save_optimizer: False
256 257 adam_b1: 0.9 # Exponential decay rate to track the first moment of past gradients.
257 258 adam_b2: 0.999 # Exponential decay rate to track the second moment of past gradients.
258 259 adam_eps: 1.e-8 # A small constant applied to the denominator outside of the square root.
259 - adam_weight_decay: 0 # AdamW weight decay
260 + adam_weight_decay: 0.0 # AdamW weight decay
260 261 max_grad_norm: 1.0
261 262
262 263 enable_profiler: False
Original file line number Diff line number Diff line change @@ -133,6 +133,7 @@ diffusion_scheduler_config: {
133 133 # Output directory
134 134 # Create a GCS bucket, e.g. my-maxtext-outputs, and set this to "gs://my-maxtext-outputs/"
135 135 base_output_directory: ""
136 + tensorboard_dir: ""
136 137
137 138 # Hardware
138 139 hardware: 'tpu' # Supported hardware types are 'tpu', 'gpu'
@@ -267,7 +268,7 @@ save_optimizer: False
267 268 adam_b1: 0.9 # Exponential decay rate to track the first moment of past gradients.
268 269 adam_b2: 0.999 # Exponential decay rate to track the second moment of past gradients.
269 270 adam_eps: 1.e-8 # A small constant applied to the denominator outside of the square root.
270 - adam_weight_decay: 0 # AdamW weight decay
271 + adam_weight_decay: 0.0 # AdamW weight decay
271 272 max_grad_norm: 1.0
272 273
273 274 enable_profiler: False
Original file line number Diff line number Diff line change @@ -128,6 +128,7 @@ diffusion_scheduler_config: {
128 128 # Output directory
129 129 # Create a GCS bucket, e.g. my-maxtext-outputs, and set this to "gs://my-maxtext-outputs/"
130 130 base_output_directory: ""
131 + tensorboard_dir: ""
131 132
132 133 # Hardware
133 134 hardware: 'tpu' # Supported hardware types are 'tpu', 'gpu'
@@ -262,7 +263,7 @@ save_optimizer: False
262 263 adam_b1: 0.9 # Exponential decay rate to track the first moment of past gradients.
263 264 adam_b2: 0.999 # Exponential decay rate to track the second moment of past gradients.
264 265 adam_eps: 1.e-8 # A small constant applied to the denominator outside of the square root.
265 - adam_weight_decay: 0 # AdamW weight decay
266 + adam_weight_decay: 0.0 # AdamW weight decay
266 267 max_grad_norm: 1.0
267 268
268 269 enable_profiler: False
Original file line number Diff line number Diff line change @@ -129,6 +129,7 @@ diffusion_scheduler_config: {
129 129 # Output directory
130 130 # Create a GCS bucket, e.g. my-maxtext-outputs, and set this to "gs://my-maxtext-outputs/"
131 131 base_output_directory: ""
132 + tensorboard_dir: ""
132 133
133 134 # Hardware
134 135 hardware: 'tpu' # Supported hardware types are 'tpu', 'gpu'
@@ -263,7 +264,7 @@ save_optimizer: False
263 264 adam_b1: 0.9 # Exponential decay rate to track the first moment of past gradients.
264 265 adam_b2: 0.999 # Exponential decay rate to track the second moment of past gradients.
265 266 adam_eps: 1.e-8 # A small constant applied to the denominator outside of the square root.
266 - adam_weight_decay: 0 # AdamW weight decay
267 + adam_weight_decay: 0.0 # AdamW weight decay
267 268 max_grad_norm: 1.0
268 269
269 270 enable_profiler: False
You can’t perform that action at this time.
0 commit comments