From 436071f3ee985dbad91eac6161630a679c873221 Mon Sep 17 00:00:00 2001
From: Yunkai
Date: Wed, 18 Feb 2026 18:45:27 +0000
Subject: [PATCH] fix: pass gts argument in _dump_generations call in _train_step

---
 agentlightning/verl/trainer.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/agentlightning/verl/trainer.py b/agentlightning/verl/trainer.py
index 413a0a1cf..bff5bccf2 100644
--- a/agentlightning/verl/trainer.py
+++ b/agentlightning/verl/trainer.py
@@ -417,10 +417,14 @@ def _train_step(self, batch_dict: dict) -> dict:
                     print(batch.batch.keys())
                     inputs = self.tokenizer.batch_decode(batch.batch["prompts"], skip_special_tokens=True)
                     outputs = self.tokenizer.batch_decode(batch.batch["responses"], skip_special_tokens=True)
+                    sample_gts = [
+                        item.non_tensor_batch.get("reward_model", {}).get("ground_truth", None) for item in batch
+                    ]
                     scores = batch.batch["token_level_scores"].sum(-1).cpu().tolist()
                     self._dump_generations(
                         inputs=inputs,
                         outputs=outputs,
+                        gts=sample_gts,
                         scores=scores,
                         reward_extra_infos_dict=reward_extra_infos_dict,
                         dump_path=rollout_data_dir,