diff --git a/docs/release/TRAJECTORIES.md b/docs/release/TRAJECTORIES.md index 6e590cb84..bb15cdd0b 100644 --- a/docs/release/TRAJECTORIES.md +++ b/docs/release/TRAJECTORIES.md @@ -447,7 +447,6 @@ sampling_args = { "extra_body": { "return_tokens_as_token_ids": True, # Return tokens as token IDs "return_token_ids": True, # Include token_ids in response - "prompt_logprobs": 1, # Optional: include prompt logprobs }, } ``` diff --git a/verifiers/rl/trainer/config.py b/verifiers/rl/trainer/config.py index 49c1824f6..60c5626eb 100644 --- a/verifiers/rl/trainer/config.py +++ b/verifiers/rl/trainer/config.py @@ -321,7 +321,6 @@ def __post_init__(self): "include_stop_str_in_output": False, "return_tokens_as_token_ids": True, "return_token_ids": True, - "prompt_logprobs": True, }, } self.gradient_accumulation_steps = 1 diff --git a/verifiers/utils/token_utils.py b/verifiers/utils/token_utils.py index cee53df59..eefe2cabd 100644 --- a/verifiers/utils/token_utils.py +++ b/verifiers/utils/token_utils.py @@ -73,7 +73,7 @@ def prepare_sampling_args_for_token_prompts( ) -> SamplingArgs: """Ensures necessary fields are set for token prompts to work.""" sampling_args["logprobs"] = True - extra_body = dict(return_token_ids=True, prompt_logprobs=True) + extra_body = dict(return_token_ids=True) if "extra_body" in sampling_args: sampling_args["extra_body"].update(extra_body) else: