From b1ee6c95f1cb5d05286ca785bc4d14101ee89e5b Mon Sep 17 00:00:00 2001 From: Jackmin801 Date: Thu, 25 Dec 2025 23:36:00 -0800 Subject: [PATCH] no prompt logprobs please --- docs/release/TRAJECTORIES.md | 1 - verifiers/rl/trainer/config.py | 1 - verifiers/utils/token_utils.py | 2 +- 3 files changed, 1 insertion(+), 3 deletions(-) diff --git a/docs/release/TRAJECTORIES.md b/docs/release/TRAJECTORIES.md index 6e590cb84..bb15cdd0b 100644 --- a/docs/release/TRAJECTORIES.md +++ b/docs/release/TRAJECTORIES.md @@ -447,7 +447,6 @@ sampling_args = { "extra_body": { "return_tokens_as_token_ids": True, # Return tokens as token IDs "return_token_ids": True, # Include token_ids in response - "prompt_logprobs": 1, # Optional: include prompt logprobs }, } ``` diff --git a/verifiers/rl/trainer/config.py b/verifiers/rl/trainer/config.py index 49c1824f6..60c5626eb 100644 --- a/verifiers/rl/trainer/config.py +++ b/verifiers/rl/trainer/config.py @@ -321,7 +321,6 @@ def __post_init__(self): "include_stop_str_in_output": False, "return_tokens_as_token_ids": True, "return_token_ids": True, - "prompt_logprobs": True, }, } self.gradient_accumulation_steps = 1 diff --git a/verifiers/utils/token_utils.py b/verifiers/utils/token_utils.py index cee53df59..eefe2cabd 100644 --- a/verifiers/utils/token_utils.py +++ b/verifiers/utils/token_utils.py @@ -73,7 +73,7 @@ def prepare_sampling_args_for_token_prompts( ) -> SamplingArgs: """Ensures necessary fields are set for token prompts to work.""" sampling_args["logprobs"] = True - extra_body = dict(return_token_ids=True, prompt_logprobs=True) + extra_body = dict(return_token_ids=True) if "extra_body" in sampling_args: sampling_args["extra_body"].update(extra_body) else: