mirror of https://github.com/inclusionAI/AReaL
0724_merge7
This commit is contained in:
parent
13fc236c99
commit
27fd51aa15
|
@ -185,8 +185,6 @@ def main(args):
|
|||
stats_tracker.scope("grpo_actor"),
|
||||
):
|
||||
stats = actor.ppo_update(batch)
|
||||
wandb.log({"actor_reward": stats[0]["grpo_actor/final_reward/avg"]})
|
||||
wandb.log({"task_reward": stats[0]["grpo_actor/task_reward/avg"]})
|
||||
actor.step_lr_scheduler()
|
||||
log_gpu_stats("ppo update")
|
||||
|
||||
|
|
Loading…
Reference in New Issue