fix dataset parsing error (#540)

* fix dataset parsing error: support a user-defined question field, to fix errors when a dataset's question field is not 'problem'
* add question field config: add the question field to script_args
* refactor: datasets prompt column

---------

Co-authored-by: lewtun <lewis.c.tunstall@gmail.com>
2025-03-28 20:17:04 +08:00
commit 1802bec75f
@@ -177,4 +177,5 @@ logs/
 eval_results/
 results/

-.vscode/
+.vscode/
+.python-version
@@ -154,3 +154,7 @@ class GRPOScriptArguments(trl.ScriptArguments):
            "help": "for each generation, evaluate these many test cases in parallel, then check if any of them failed (0 score): if so stop evaluating; otherwise continue with the next batch of test cases. Useful to avoid overloading the eval server + save time on wrong solutions"
        },
    )
+    dataset_prompt_column: str = field(
+        default="prompt",
+        metadata={"help": "Column to use as prompts for training."},
+    )
@@ -84,13 +84,16 @@ def main(script_args, training_args, model_args):
    reward_funcs = get_reward_funcs(script_args)

    # Format into conversation
-    def make_conversation(example):
+    def make_conversation(example, prompt_column: str = script_args.dataset_prompt_column):
        prompt = []

        if training_args.system_prompt is not None:
            prompt.append({"role": "system", "content": training_args.system_prompt})

-        prompt.append({"role": "user", "content": example["problem"]})
+        if prompt_column not in example:
+            raise ValueError(f"Dataset Question Field Error: {prompt_column} is not supported.")
+
+        prompt.append({"role": "user", "content": example[prompt_column]})
        return {"prompt": prompt}

    dataset = dataset.map(make_conversation)