This commit is contained in:
Jake Poznanski 2025-08-21 17:11:33 +00:00
parent 6fe630516a
commit de719edf49

View File

@@ -170,9 +170,10 @@ class OlmOCRDataset(Dataset):
 # Return None if processing fails
 return None
-def simple_length_reward(completions_ids, **kwargs):
+def simple_length_reward(completion_ids, **kwargs):
 """Reward function that assigns higher scores to longer completions (in terms of token count)."""
-return [float(len(ids)) for ids in completions_ids]
+logger.info(f"Reward function called {kwargs}")
+return [float(len(ids)) for ids in completion_ids]
 def main():