Skip to content

Commit

Permalink
add yamls
Browse files Browse the repository at this point in the history
  • Loading branch information
JvThunder committed Mar 18, 2024
1 parent eeac250 commit 008a6cb
Show file tree
Hide file tree
Showing 10 changed files with 156 additions and 2 deletions.
7 changes: 5 additions & 2 deletions lmms_eval/tasks/olympiadbench/olympiadbench.yaml
Original file line number Diff line number Diff line change
@@ -1,6 +1,9 @@
# Group `olympiadbench`: bundles the tasks listed under `task`.
group: olympiadbench
task:
  # NOTE(review): the hunk header for this file (-1,6 +1,9; 5 additions,
  # 2 deletions) suggests the first two entries below were removed by this
  # commit and only appear here because the diff markers were lost - confirm.
  - olympiadbench_test
  - olympiadbench_test_auto_scoring
  - olympiadbench_test_math_en_comp
  - olympiadbench_test_math_zh_comp
  - olympiadbench_test_math_zh_cee
  - olympiadbench_test_physics_en_comp
  - olympiadbench_test_physics_zh_cee
# Config metadata; kept as a one-element list holding the version mapping.
metadata:
  - version: 0.0
6 changes: 6 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_en.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# Group `olympiadbench_test_en`: bundles the two `_en_` tasks listed below.
group: olympiadbench_test_en
task:
  - olympiadbench_test_math_en_comp
  - olympiadbench_test_physics_en_comp
# Config metadata; kept as a one-element list holding the version mapping.
metadata:
  - version: 0.0
7 changes: 7 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_math.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
# Group `olympiadbench_test_math`: bundles the three `_math_` tasks listed below.
group: olympiadbench_test_math
task:
  - olympiadbench_test_math_en_comp
  - olympiadbench_test_math_zh_comp
  - olympiadbench_test_math_zh_cee
# Config metadata; kept as a one-element list holding the version mapping.
metadata:
  - version: 0.0
25 changes: 25 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_math_en_comp.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# Task config `olympiadbench_test_math_en_comp`: reads the
# `test_math_en_comp` split of `lmms-lab/OlympiadBench`.
dataset_path: lmms-lab/OlympiadBench
# Extra arguments for loading the dataset.
# NOTE(review): `token` presumably enables authenticated access - confirm.
dataset_kwargs:
  token: true
task: "olympiadbench_test_math_en_comp"
test_split: test_math_en_comp
output_type: generate_until
# `!function` is a custom tag naming a callable in `utils`; it must be
# resolved by the consuming loader (a plain safe loader will reject it).
doc_to_visual: !function utils.olympiadbench_doc_to_visual
doc_to_text: !function utils.olympiadbench_doc_to_text
doc_to_target: "answer"
# Generation settings: sampling is off (`do_sample: false`) with one beam.
generation_kwargs:
  # Presumably the strings at which generation stops - confirm.
  until:
    - "ASSISTANT:"
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.olympiadbench_process_results
# Two metrics: `submission` uses a custom aggregation function from `utils`;
# `exact_match` is aggregated with `mean`.
metric_list:
  - metric: submission
    aggregation: !function utils.olympiadbench_aggregate_results
    higher_is_better: true
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
25 changes: 25 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_math_zh_cee.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# Task config `olympiadbench_test_math_zh_cee`: reads the
# `test_math_zh_cee` split of `lmms-lab/OlympiadBench`.
dataset_path: lmms-lab/OlympiadBench
# Extra arguments for loading the dataset.
# NOTE(review): `token` presumably enables authenticated access - confirm.
dataset_kwargs:
  token: true
task: "olympiadbench_test_math_zh_cee"
test_split: test_math_zh_cee
output_type: generate_until
# `!function` is a custom tag naming a callable in `utils`; it must be
# resolved by the consuming loader (a plain safe loader will reject it).
doc_to_visual: !function utils.olympiadbench_doc_to_visual
doc_to_text: !function utils.olympiadbench_doc_to_text
doc_to_target: "answer"
# Generation settings: sampling is off (`do_sample: false`) with one beam.
generation_kwargs:
  # Presumably the strings at which generation stops - confirm.
  until:
    - "ASSISTANT:"
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.olympiadbench_process_results
# Two metrics: `submission` uses a custom aggregation function from `utils`;
# `exact_match` is aggregated with `mean`.
metric_list:
  - metric: submission
    aggregation: !function utils.olympiadbench_aggregate_results
    higher_is_better: true
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
25 changes: 25 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_math_zh_comp.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# Task config `olympiadbench_test_math_zh_comp`: reads the
# `test_math_zh_comp` split of `lmms-lab/OlympiadBench`.
dataset_path: lmms-lab/OlympiadBench
# Extra arguments for loading the dataset.
# NOTE(review): `token` presumably enables authenticated access - confirm.
dataset_kwargs:
  token: true
task: "olympiadbench_test_math_zh_comp"
test_split: test_math_zh_comp
output_type: generate_until
# `!function` is a custom tag naming a callable in `utils`; it must be
# resolved by the consuming loader (a plain safe loader will reject it).
doc_to_visual: !function utils.olympiadbench_doc_to_visual
doc_to_text: !function utils.olympiadbench_doc_to_text
doc_to_target: "answer"
# Generation settings: sampling is off (`do_sample: false`) with one beam.
generation_kwargs:
  # Presumably the strings at which generation stops - confirm.
  until:
    - "ASSISTANT:"
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.olympiadbench_process_results
# Two metrics: `submission` uses a custom aggregation function from `utils`;
# `exact_match` is aggregated with `mean`.
metric_list:
  - metric: submission
    aggregation: !function utils.olympiadbench_aggregate_results
    higher_is_better: true
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
6 changes: 6 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_physics.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# Group `olympiadbench_test_physics`: bundles the two `_physics_` tasks
# listed below.
group: olympiadbench_test_physics
task:
  - olympiadbench_test_physics_en_comp
  - olympiadbench_test_physics_zh_cee
# Config metadata; kept as a one-element list holding the version mapping.
metadata:
  - version: 0.0
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# Task config `olympiadbench_test_physics_en_comp`: reads the
# `test_physics_en_comp` split of `lmms-lab/OlympiadBench`.
dataset_path: lmms-lab/OlympiadBench
# Extra arguments for loading the dataset.
# NOTE(review): `token` presumably enables authenticated access - confirm.
dataset_kwargs:
  token: true
task: "olympiadbench_test_physics_en_comp"
test_split: test_physics_en_comp
output_type: generate_until
# `!function` is a custom tag naming a callable in `utils`; it must be
# resolved by the consuming loader (a plain safe loader will reject it).
doc_to_visual: !function utils.olympiadbench_doc_to_visual
doc_to_text: !function utils.olympiadbench_doc_to_text
doc_to_target: "answer"
# Generation settings: sampling is off (`do_sample: false`) with one beam.
generation_kwargs:
  # Presumably the strings at which generation stops - confirm.
  until:
    - "ASSISTANT:"
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.olympiadbench_process_results
# Two metrics: `submission` uses a custom aggregation function from `utils`;
# `exact_match` is aggregated with `mean`.
metric_list:
  - metric: submission
    aggregation: !function utils.olympiadbench_aggregate_results
    higher_is_better: true
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
# Task config `olympiadbench_test_physics_zh_cee`: reads the
# `test_physics_zh_cee` split of `lmms-lab/OlympiadBench`.
dataset_path: lmms-lab/OlympiadBench
# Extra arguments for loading the dataset.
# NOTE(review): `token` presumably enables authenticated access - confirm.
dataset_kwargs:
  token: true
task: "olympiadbench_test_physics_zh_cee"
test_split: test_physics_zh_cee
output_type: generate_until
# `!function` is a custom tag naming a callable in `utils`; it must be
# resolved by the consuming loader (a plain safe loader will reject it).
doc_to_visual: !function utils.olympiadbench_doc_to_visual
doc_to_text: !function utils.olympiadbench_doc_to_text
doc_to_target: "answer"
# Generation settings: sampling is off (`do_sample: false`) with one beam.
generation_kwargs:
  # Presumably the strings at which generation stops - confirm.
  until:
    - "ASSISTANT:"
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.olympiadbench_process_results
# Two metrics: `submission` uses a custom aggregation function from `utils`;
# `exact_match` is aggregated with `mean`.
metric_list:
  - metric: submission
    aggregation: !function utils.olympiadbench_aggregate_results
    higher_is_better: true
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
7 changes: 7 additions & 0 deletions lmms_eval/tasks/olympiadbench/olympiadbench_test_zh.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
# Group `olympiadbench_test_zh`: bundles the three `_zh_` tasks listed below.
group: olympiadbench_test_zh
task:
  - olympiadbench_test_math_zh_comp
  - olympiadbench_test_math_zh_cee
  - olympiadbench_test_physics_zh_cee
# Config metadata; kept as a one-element list holding the version mapping.
metadata:
  - version: 0.0

0 comments on commit 008a6cb

Please sign in to comment.