Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 10 additions & 1 deletion configs/zero3.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,15 @@ deepspeed_config:
zero3_init_flag: true
zero3_save_16bit_model: true
zero_stage: 3
overlap_comm: true
contiguous_gradients: true
reduce_bucket_size: 5e8
stage3_prefetch_bucket_size: 5e8
stage3_param_persistence_threshold: 1e5
sub_group_size: 1e5
dump_state: false
gradient_clipping: auto

distributed_type: DEEPSPEED
downcast_bf16: 'no'
machine_rank: 0
Expand All @@ -19,4 +28,4 @@ same_network: true
tpu_env: []
tpu_use_cluster: false
tpu_use_sudo: false
use_cpu: false
use_cpu: false
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@ authors = [
version = "0.1.0"
description = "Verifiers for reinforcement learning with LLMs"
license = {text = "MIT"}
requires-python = ">=3.11"
requires-python = "==3.12.2"
dependencies = [
"huanzhi-utils",
"scikit-learn",
Expand Down
16 changes: 8 additions & 8 deletions verifiers/tools/bfcl_tools.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,14 +3,14 @@
import json

INVOLVED_CLASS_TO_FUNC_DOC_PATH = {
"GorillaFileSystem": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/gorilla_file_system.json",
"MathAPI": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/math_api.json",
"MessageAPI": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/message_api.json",
"TwitterAPI": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/posting_api.json",
"TicketAPI": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/ticket_api.json",
"TradingBot": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/trading_bot.json",
"TravelAPI": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/travel_booking.json",
"VehicleControlAPI": "/root/richard/test/verifiers/verifiers/tools/bfcl_tools/vehicle_control.json",
"GorillaFileSystem": "verifiers/tools/bfcl_tools/gorilla_file_system.json",
"MathAPI": "verifiers/tools/bfcl_tools/math_api.json",
"MessageAPI": "verifiers/tools/bfcl_tools/message_api.json",
"TwitterAPI": "verifiers/tools/bfcl_tools/posting_api.json",
"TicketAPI": "verifiers/tools/bfcl_tools/ticket_api.json",
"TradingBot": "verifiers/tools/bfcl_tools/trading_bot.json",
"TravelAPI": "verifiers/tools/bfcl_tools/travel_booking.json",
"VehicleControlAPI": "verifiers/tools/bfcl_tools/vehicle_control.json",
}

def construct_tools_from_involved_classes(involved_classes: List[str]) -> str:
Expand Down
4 changes: 2 additions & 2 deletions verifiers/utils/data_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -106,8 +106,8 @@ def format_bfcl_prompt(system_prompt: str | None = None, involved_classes: List[

def preprocess_bfcl_dataset(system_prompt: str | None = None, curriculum_learning: bool = False) -> Dataset:
# TODO: Change to local path
multi_turn_base_data = load_file("/root/richard/test/verifiers/verifiers/berkeley-function-call-leaderboard/data/BFCL_v3_multi_turn_base.json")
multi_turn_base_answer = load_file("/root/richard/test/verifiers/verifiers/berkeley-function-call-leaderboard/data/possible_answer/BFCL_v3_multi_turn_base.json")
multi_turn_base_data = load_file("verifiers/berkeley-function-call-leaderboard/data/BFCL_v3_multi_turn_base.json")
multi_turn_base_answer = load_file("verifiers/berkeley-function-call-leaderboard/data/possible_answer/BFCL_v3_multi_turn_base.json")

# Reprocess the columns into serializable format and add num_turns
for i in range(len(multi_turn_base_data)):
Expand Down