-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathrun_tasks.sh
65 lines (52 loc) · 1.28 KB
/
run_tasks.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
#!/bin/bash
# Launch run_tasks.py in the background for one combination of model, task
# category, agent strategy, provider and eval mode. The Python process's
# stdout and stderr are captured in a per-configuration file under LOG_DIR.
#
# To change the configuration, edit the assignments below; the commented-out
# lines are alternative values kept for quick switching.

# Stop on a failed setup step (e.g. mkdir) or a mistyped/unset variable rather
# than launching a run with a broken command line.
set -euo pipefail

AGENT_MODEL=gpt-4o-2024-08-06
# AGENT_MODEL=claude-3-5-sonnet-20240620
# AGENT_MODEL=llama3.1-405b-instruct

TASK_CATEGORY=top_issue_identification

# NOTE: RESULT_DIR is what gets passed to run_tasks.py as --log_dir; it is a
# different directory from LOG_DIR, which only holds this script's capture of
# the process output.
# RESULT_DIR=results_natural_1002
RESULT_DIR=results_tc_natural_1002

# AGENT_STRATEGY=react
AGENT_STRATEGY=tool_call

# LITELLM_PROVIDER=together_ai
# LITELLM_PROVIDER=bedrock
LITELLM_PROVIDER=openai
# LITELLM_PROVIDER=vertex_ai

EVAL_MODE=aided

LOG_DIR=logs_natural_1002
LOG_FILE="${LOG_DIR}/run_${AGENT_MODEL}_${AGENT_STRATEGY}_${TASK_CATEGORY}_${EVAL_MODE}.log"

mkdir -p -- "${LOG_DIR}"

# Build the command as an array so each value stays a single argument even if
# it is later edited to contain spaces or glob characters.
run_cmd=(
  python run_tasks.py
  --model "${AGENT_MODEL}"
  --task_category "${TASK_CATEGORY}"
  --agent_eval_mode "${EVAL_MODE}"
  --log_dir "${RESULT_DIR}"
  --agent_strategy "${AGENT_STRATEGY}"
  --llm_provider "${LITELLM_PROVIDER}"
)

# Run detached from the foreground; both stdout and stderr go to LOG_FILE.
"${run_cmd[@]}" > "${LOG_FILE}" 2>&1 &
## MODELS (candidate values for AGENT_MODEL)
# claude-3-5-sonnet-20240620
# claude-3-opus-20240229
# gpt-4o-2024-08-06
# gpt-3.5-turbo-0125
# llama3.1-8b-instruct
# llama3.1-70b-instruct
# llama3.1-405b-instruct
# mixtral_8x22b_instruct
## TASKS (candidate values for TASK_CATEGORY)
# policy_violation_identification
# monthly_trend_analysis
# top_issue_identification
# named_entity_disambiguation
# best_region_identification
# handle_time
# knowledge_qa
# transfer_count
# case_routing
## PROVIDERS (candidate values for LITELLM_PROVIDER)
# bedrock
# openai
# together_ai
# vertex_ai
## AGENT STRATEGIES (candidate values for AGENT_STRATEGY)
# act
# react
# tool_call
# tool_call_flex