Skip to content

Commit

Permalink
Latest changes
Browse files Browse the repository at this point in the history
  • Loading branch information
SujeethJinesh committed Dec 5, 2024
1 parent a75d084 commit 4f321d7
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 2 deletions.
2 changes: 1 addition & 1 deletion MaxText/configs/base.yml
Original file line number Diff line number Diff line change
Expand Up @@ -467,7 +467,7 @@ enable_jax_profiler: False
jax_profiler_port: 9999

# Checkpoint Structured logging
-enable_checkpoint_cloud_logger: False
+enable_checkpoint_cloud_logger: True

# Single-controller
enable_single_controller: True
Expand Down
3 changes: 2 additions & 1 deletion benchmarks/maxtext_xpk_runner.py
Original file line number Diff line number Diff line change
Expand Up @@ -310,6 +310,7 @@ def build_user_command(
f' {libtpu_flags}'
# f' echo {model.tuning_params["sa_block_q"]}-q-dq-{model.tuning_params["sa_block_q_dq"]}-q-dkv-{model.tuning_params["sa_block_q_dkv"]} &&'
# f' echo {model.tuning_params["ici_fsdp_parallelism"]} {model.tuning_params["ici_tensor_parallelism"]} &&'
+f' export ENABLE_PATHWAYS_PERSISTENCE=1 &&'
f' export JAX_PLATFORMS={jax_platforms} &&'
# f' export JAX_DEBUG_NANS=True &&'
# f' export TPU_MEGACORE=megachip_tccontrol &&'
Expand All @@ -326,7 +327,7 @@ def build_user_command(
' vertex_tensorboard_project="" vertex_tensorboard_region=""'
f' run_name="{pathways_prefix}{run_name}"'
f' enable_checkpointing=True'
-f' checkpoint_period=40'
+f' checkpoint_period=80'
f' async_checkpointing=True'
)

Expand Down

0 comments on commit 4f321d7

Please sign in to comment.