You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
tasks: Annotated[str, Argument(help="Comma-separated list of tasks to evaluate on.")],
46
46
# === Common parameters ===
47
47
dataset_loading_processes: Annotated[
48
-
int, Option(help="Number of processes to use for dataset loading.", rich_help_panel=HELP_PANNEL_NAME_1)
48
+
int, Option(help="Number of processes to use for dataset loading.", rich_help_panel=HELP_PANEL_NAME_1)
49
49
] =1,
50
50
custom_tasks: Annotated[
51
-
Optional[str], Option(help="Path to custom tasks directory.", rich_help_panel=HELP_PANNEL_NAME_1)
51
+
Optional[str], Option(help="Path to custom tasks directory.", rich_help_panel=HELP_PANEL_NAME_1)
52
52
] =None,
53
53
num_fewshot_seeds: Annotated[
54
-
int, Option(help="Number of seeds to use for few-shot evaluation.", rich_help_panel=HELP_PANNEL_NAME_1)
54
+
int, Option(help="Number of seeds to use for few-shot evaluation.", rich_help_panel=HELP_PANEL_NAME_1)
55
55
] =1,
56
+
remove_reasoning_tags: Annotated[
57
+
bool, Option(help="Remove reasoning tags from responses.", rich_help_panel=HELP_PANEL_NAME_1)
58
+
] =True,
59
+
reasoning_tags: Annotated[
60
+
str|None,
61
+
Option(
62
+
help="List of reasoning tags (provided as pairs) to remove from responses. Default is [('<think>', '</think>')].",
63
+
rich_help_panel=HELP_PANEL_NAME_1,
64
+
),
65
+
] =None,
56
66
# === saving ===
57
67
output_dir: Annotated[
58
-
str, Option(help="Output directory for evaluation results.", rich_help_panel=HELP_PANNEL_NAME_2)
68
+
str, Option(help="Output directory for evaluation results.", rich_help_panel=HELP_PANEL_NAME_2)
59
69
] ="results",
60
70
results_path_template: Annotated[
61
71
str|None,
62
72
Option(
63
73
help="Template path for where to save the results, you have access to 3 variables, `output_dir`, `org` and `model`. for example a template can be `'{output_dir}/1234/{org}+{model}'`",
64
-
rich_help_panel=HELP_PANNEL_NAME_2,
74
+
rich_help_panel=HELP_PANEL_NAME_2,
65
75
),
66
76
] =None,
67
77
push_to_hub: Annotated[
68
-
bool, Option(help="Push results to the huggingface hub.", rich_help_panel=HELP_PANNEL_NAME_2)
78
+
bool, Option(help="Push results to the huggingface hub.", rich_help_panel=HELP_PANEL_NAME_2)
69
79
] =False,
70
80
push_to_tensorboard: Annotated[
71
-
bool, Option(help="Push results to tensorboard.", rich_help_panel=HELP_PANNEL_NAME_2)
81
+
bool, Option(help="Push results to tensorboard.", rich_help_panel=HELP_PANEL_NAME_2)
72
82
] =False,
73
83
public_run: Annotated[
74
-
bool, Option(help="Push results and details to a public repo.", rich_help_panel=HELP_PANNEL_NAME_2)
84
+
bool, Option(help="Push results and details to a public repo.", rich_help_panel=HELP_PANEL_NAME_2)
75
85
] =False,
76
86
results_org: Annotated[
77
-
Optional[str], Option(help="Organization to push results to.", rich_help_panel=HELP_PANNEL_NAME_2)
87
+
Optional[str], Option(help="Organization to push results to.", rich_help_panel=HELP_PANEL_NAME_2)
78
88
] =None,
79
89
save_details: Annotated[
80
-
bool, Option(help="Save detailed, sample per sample, results.", rich_help_panel=HELP_PANNEL_NAME_2)
90
+
bool, Option(help="Save detailed, sample per sample, results.", rich_help_panel=HELP_PANEL_NAME_2)
81
91
] =False,
82
92
# === debug ===
83
93
max_samples: Annotated[
84
-
Optional[int], Option(help="Maximum number of samples to evaluate on.", rich_help_panel=HELP_PANNEL_NAME_3)
94
+
Optional[int], Option(help="Maximum number of samples to evaluate on.", rich_help_panel=HELP_PANEL_NAME_3)
85
95
] =None,
86
96
job_id: Annotated[
87
-
int, Option(help="Optional job id for future refenrence.", rich_help_panel=HELP_PANNEL_NAME_3)
97
+
int, Option(help="Optional job id for future refenrence.", rich_help_panel=HELP_PANEL_NAME_3)
0 commit comments