Skip to content

Commit

Permalink
exp: mixtral all datasets
Browse files Browse the repository at this point in the history
  • Loading branch information
DriesSmit committed Apr 20, 2024
1 parent 893e513 commit 5f49e22
Show file tree
Hide file tree
Showing 11 changed files with 22 additions and 22 deletions.
2 changes: 1 addition & 1 deletion experiments/conf/config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@ defaults:
- dataset: medqa # [options: usmle, medmcqa, mmlu, pubmedqa, medqa, ciar, cosmosqa, gpqa]
- _self_

max_eval_count: 100
max_eval_count: None
num_eval_workers: 1 # Each worker receives a full batch of questions.
eval_batch_size: 10 # Defaults to batch_size=1.
verbose: False
Expand Down
6 changes: 3 additions & 3 deletions experiments/conf/system/chateval.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,13 +13,13 @@ agreement_intensity: -1 # -1 for default behavior, otherwise {0, ..., 10} for ag
agents: # options: [gpt, palm]
# Agent 1
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.cot}"
# Agent 2
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.cot}"
# Summarizer
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.summarizer}"
6 changes: 3 additions & 3 deletions experiments/conf/system/debateqa.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,9 +15,9 @@ agents: # options: [gpt, palm]
# - prompt: "${system.agent_prompts.cot}"

# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-3.5-turbo-0613" # gpt uses gpt-3.5 engine
- prompt: "${system.agent_prompts.cot}"
# - - "${system.gpt}"
# - engine: "gpt-3.5-turbo-0613" # gpt uses gpt-3.5 engine
# - prompt: "${system.agent_prompts.cot}"

# PaLM agent
- - "${system.palm}" # palm uses default setup
Expand Down
2 changes: 1 addition & 1 deletion experiments/conf/system/ensemble_refinement.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@ num_aggregation_steps: 1
agents: # options: [gpt, palm]
# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.er_simple}"
- few_shot_examples: ${system.medpalm_examples.few_shot} # False, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}
- sampling:
Expand Down
6 changes: 3 additions & 3 deletions experiments/conf/system/google_mad.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,18 +14,18 @@ agreement_intensity: -1 # -1 for default behavior, otherwise {0, ..., 10} for ag
agents: # options: [gpt, palm]
# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.simple}"
- few_shot_examples: ${system.medpalm_examples.few_shot} # None, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}

# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.simple}"
- few_shot_examples: ${system.medpalm_examples.few_shot} # None, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}

# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.simple}"
- few_shot_examples: ${system.medpalm_examples.few_shot} # None, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}
2 changes: 1 addition & 1 deletion experiments/conf/system/gpt.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@ defaults: # options: [simple, cot, letter, explain...]: any prompt used in 'agen
gpt:
_target_: debatellm.agents.GPT
prompt: ${system.agent_prompts.simple}
engine: "gpt-3.5-turbo-0613"
engine: "mixtral-8x7b-instruct"
few_shot_examples: False # Options include: [False, ${system.medpalm_examples.few_shot}, ${system.medpalm_examples.cot_few_shot}]
mock: False
sampling:
Expand Down
2 changes: 1 addition & 1 deletion experiments/conf/system/medprompt.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ name: medprompt
agents: # options: [gpt, palm]
# GPT-3 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-4 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- cost_per_prompt_token: 0.03 # dollar costs per 1000 prompt token
- cost_per_response_token: 0.06 # dollar costs per 1000 response token
- prompt: "${system.agent_prompts.cot_medprompt}"
Expand Down
4 changes: 2 additions & 2 deletions experiments/conf/system/multi_agent_debate.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,9 @@ num_rounds: 2
agents: # options: [gpt, palm]
# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.cot}"
# GPT-3.5 agent
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.cot}"
2 changes: 1 addition & 1 deletion experiments/conf/system/spp_synergy.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -10,5 +10,5 @@ name: spp_synergy # Used for distinguishing between single agent GPT.
agents: # options: [gpt, palm]
# Agent 1
- - "${system.gpt}"
- engine: "gpt-4" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.spp_original}" # options: [spp_expert, spp_original]
6 changes: 3 additions & 3 deletions experiments/conf/system/tsinghua_mad.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,21 +14,21 @@ agreement_intensity: -1 # -1: fallback to default prompt. [0, 1, ..., 10]: agree
agents: # options: [gpt, palm]
# Agent 1
- - "${system.gpt}"
- engine: "gpt-3.5-turbo-0613" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.angel}"
- prompt_from_history: "tsinghua_mad"
- few_shot_examples: None # None, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}

# Agent 2
- - "${system.gpt}"
- engine: "gpt-3.5-turbo-0613" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.devil}"
- prompt_from_history: "tsinghua_mad"
- few_shot_examples: None # None, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}

# Judge
- - "${system.gpt}"
- engine: "gpt-3.5-turbo-0613" # gpt uses gpt-3.5 engine
- engine: "mixtral-8x7b-instruct"  # gpt agent config running the Mixtral 8x7B Instruct engine
- prompt: "${system.agent_prompts.judge_tsinghua}"
- prompt_from_history: "tsinghua_judge"
- few_shot_examples: None # None, ${system.medpalm_examples.few_shot} or ${system.medpalm_examples.cot_few_shot}
Expand Down
6 changes: 3 additions & 3 deletions scripts/launch_experiments.py
Original file line number Diff line number Diff line change
Expand Up @@ -204,9 +204,9 @@
# Add all datasets to the experiments
for exp in exp_table:
exp["dataset"] = [
# "cosmosqa",
# "ciar",
# "gpqa",
"cosmosqa",
"ciar",
"gpqa",
"medqa",
"pubmedqa",
"mmlu",
Expand Down

0 comments on commit 5f49e22

Please sign in to comment.