diff --git a/trainers/rewards/custom_rewards.py b/trainers/rewards/custom_rewards.py index 54cf724..09faf58 100644 --- a/trainers/rewards/custom_rewards.py +++ b/trainers/rewards/custom_rewards.py @@ -44,6 +44,8 @@ def custom_reward_func(completions: List[str], **kwargs) -> List[float]: # - Check for specific patterns or keywords # - Validate output format # - Score based on custom criteria + _ = completion # Placeholder use; replace with real scoring logic + _ = completion # Placeholder use; replace with real scoring logic reward = 0.0 # Placeholder: currently returns 0.0 rewards.append(reward) # =========================================