Skip to content

Commit

Permalink
Increase training time and number of samples to compare in the PC perf…
Browse files Browse the repository at this point in the history
…ormance test.
  • Loading branch information
ernestum committed Oct 11, 2023
1 parent f053932 commit 1b20336
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions tests/algorithms/test_preference_comparisons.py
Original file line number Diff line number Diff line change
Expand Up @@ -1068,7 +1068,7 @@ def test_that_trainer_improves(
novice_agent_rewards, _ = evaluation.evaluate_policy(
agent_trainer.algorithm.policy,
action_is_reward_venv,
25,
50,
return_episode_rewards=True,
)

Expand All @@ -1077,7 +1077,7 @@ def test_that_trainer_improves(
# after this training, and thus `later_rewards` should have lower loss.
first_reward_network_stats = main_trainer.train(20, 20)

later_reward_network_stats = main_trainer.train(50, 20)
later_reward_network_stats = main_trainer.train(100, 40)
assert (
first_reward_network_stats["reward_loss"]
> later_reward_network_stats["reward_loss"]
Expand All @@ -1087,7 +1087,7 @@ def test_that_trainer_improves(
trained_agent_rewards, _ = evaluation.evaluate_policy(
agent_trainer.algorithm.policy,
action_is_reward_venv,
25,
50,
return_episode_rewards=True,
)

Expand Down

0 comments on commit 1b20336

Please sign in to comment.