Fix orbax

1b81fc0d · sbl1996@126.com · d9334955 · 1b81fc0d
Commit 1b81fc0d authored Jun 29, 2024 by sbl1996@126.com
Show whitespace changes
Inline Side-by-side

Showing with 4 additions and 3 deletions

scripts/cleanba_nnx.py scripts/cleanba_nnx.py +4 -3

No files found.
--- a/scripts/cleanba_nnx.py
+++ b/scripts/cleanba_nnx.py
@@ -1154,10 +1154,10 @@ def main():
            *list(zip(*sharded_data_list)),
            learner_keys,
        )
-        unreplicated_params = flax.jax_utils.unreplicate(get_state(agent_state))
+        new_state = get_state(agent_state)
        params_queue_put_time = 0
        for d_idx, d_id in enumerate(args.actor_device_ids):
-            device_params = jax.device_put(unreplicated_params, local_devices[d_id])
+            device_params = jax.device_put(flax.jax_utils.unreplicate(new_state), local_devices[d_id])
            device_params["encoder"]['id_embed']["embedding"].value.block_until_ready()
            params_queue_put_start = time.time()
            for thread_id in range(args.num_actor_threads):
@@ -1197,7 +1197,8 @@ def main():
        if learner_policy_version % args.save_interval == 0 and not args.debug:
            M_steps = tb_global_step // 2**20
            ckpt_name = f"{timestamp}_{M_steps}M"
-            ckpt_maneger.save(unreplicated_params, ckpt_name)
+            new_state = jax.tree.map(orbax.utils.fully_replicated_host_local_array_to_global_array, new_state)
+            ckpt_maneger.save(new_state, ckpt_name)
        if learner_policy_version >= args.num_updates:
            break