From 55aa6eb74cd58c3c809b272f2950f0bc7ed91c2f Mon Sep 17 00:00:00 2001 From: Maximilian Ernestus Date: Mon, 8 Jan 2024 16:32:34 +0100 Subject: [PATCH] Ensure that PC does at least one comparison per iteration. --- src/imitation/algorithms/preference_comparisons.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/imitation/algorithms/preference_comparisons.py b/src/imitation/algorithms/preference_comparisons.py index 14a8fad5b..1b0a2b01b 100644 --- a/src/imitation/algorithms/preference_comparisons.py +++ b/src/imitation/algorithms/preference_comparisons.py @@ -1678,6 +1678,8 @@ def train( unnormalized_probs = vec_schedule(np.linspace(0, 1, self.num_iterations)) probs = unnormalized_probs / np.sum(unnormalized_probs) shares = util.oric(probs * total_comparisons) + shares[shares <= 0] = 1 # ensure we request at least one comparison per iteration + schedule = [initial_comparisons] + shares.tolist() print(f"Query schedule: {schedule}")