Skip to content

Commit

Permalink
Merge branch 'neurips_eval' into msaroufim/corr2cause
Browse files Browse the repository at this point in the history
  • Loading branch information
msaroufim authored Nov 8, 2023
2 parents 3901ff5 + 1111ae1 commit 8b40dd7
Showing 1 changed file with 88 additions and 4 deletions.
92 changes: 88 additions & 4 deletions private_run_specs.conf
Original file line number Diff line number Diff line change
@@ -1,6 +1,90 @@
entries: [
{description: "corr2cause:model=neurips/local", priority: 1}

{description: "sam_sum:model=neurips/local,max_train_instances=3", priority: 1}
{description: "ethics_utilitarianism:model=neurips/local", priority: 1}
# List of run entries. Each entry pairs a run description string
# ("<scenario>:<key>=<value>,...") with an integer priority.
# NOTE(review): how the consumer orders or filters on `priority` is not shown
# in this file — confirm against the runner before changing any value.
entries: [
## Real
# NOTE(review): what "Real" is meant to distinguish these entries from is not
# stated in this file — TODO confirm and expand this label.

# `math` runs on model=text_code with use_official_examples=True:
# seven subjects at each of levels 1-5. Every entry of a given level shares one
# priority: level 1 -> 2, levels 2 and 4 -> 4, levels 3 and 5 -> 3.

# Level 1 (priority 2)
{description: "math:model=text_code,subject=number_theory,level=1,use_official_examples=True", priority: 2}
{description: "math:model=text_code,subject=intermediate_algebra,level=1,use_official_examples=True", priority: 2}
{description: "math:model=text_code,subject=algebra,level=1,use_official_examples=True", priority: 2}
{description: "math:model=text_code,subject=prealgebra,level=1,use_official_examples=True", priority: 2}
{description: "math:model=text_code,subject=geometry,level=1,use_official_examples=True", priority: 2}
{description: "math:model=text_code,subject=counting_and_probability,level=1,use_official_examples=True", priority: 2}
{description: "math:model=text_code,subject=precalculus,level=1,use_official_examples=True", priority: 2}

# Level 2 (priority 4)
{description: "math:model=text_code,subject=number_theory,level=2,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=intermediate_algebra,level=2,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=algebra,level=2,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=prealgebra,level=2,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=geometry,level=2,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=counting_and_probability,level=2,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=precalculus,level=2,use_official_examples=True", priority: 4}

# Level 3 (priority 3)
{description: "math:model=text_code,subject=number_theory,level=3,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=intermediate_algebra,level=3,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=algebra,level=3,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=prealgebra,level=3,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=geometry,level=3,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=counting_and_probability,level=3,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=precalculus,level=3,use_official_examples=True", priority: 3}

# Level 4 (priority 4)
{description: "math:model=text_code,subject=number_theory,level=4,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=intermediate_algebra,level=4,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=algebra,level=4,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=prealgebra,level=4,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=geometry,level=4,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=counting_and_probability,level=4,use_official_examples=True", priority: 4}
{description: "math:model=text_code,subject=precalculus,level=4,use_official_examples=True", priority: 4}

# Level 5 (priority 3)
{description: "math:model=text_code,subject=number_theory,level=5,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=intermediate_algebra,level=5,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=algebra,level=5,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=prealgebra,level=5,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=geometry,level=5,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=counting_and_probability,level=5,use_official_examples=True", priority: 3}
{description: "math:model=text_code,subject=precalculus,level=5,use_official_examples=True", priority: 3}

# `math` runs on model=text_code with chain-of-thought prompting
# (use_chain_of_thought=True): seven subjects at each of levels 1-5.
# Every entry of a given level shares one priority:
# level 1 -> 2, levels 2 and 4 -> 4, levels 3 and 5 -> 3.

# Level 1 (priority 2)
{description: "math:model=text_code,subject=number_theory,level=1,use_chain_of_thought=True", priority: 2}
{description: "math:model=text_code,subject=intermediate_algebra,level=1,use_chain_of_thought=True", priority: 2}
{description: "math:model=text_code,subject=algebra,level=1,use_chain_of_thought=True", priority: 2}
{description: "math:model=text_code,subject=prealgebra,level=1,use_chain_of_thought=True", priority: 2}
{description: "math:model=text_code,subject=geometry,level=1,use_chain_of_thought=True", priority: 2}
{description: "math:model=text_code,subject=counting_and_probability,level=1,use_chain_of_thought=True", priority: 2}
{description: "math:model=text_code,subject=precalculus,level=1,use_chain_of_thought=True", priority: 2}

# Level 2 (priority 4)
{description: "math:model=text_code,subject=number_theory,level=2,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=intermediate_algebra,level=2,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=algebra,level=2,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=prealgebra,level=2,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=geometry,level=2,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=counting_and_probability,level=2,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=precalculus,level=2,use_chain_of_thought=True", priority: 4}

# Level 3 (priority 3)
{description: "math:model=text_code,subject=number_theory,level=3,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=intermediate_algebra,level=3,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=algebra,level=3,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=prealgebra,level=3,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=geometry,level=3,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=counting_and_probability,level=3,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=precalculus,level=3,use_chain_of_thought=True", priority: 3}

# Level 4 (priority 4)
{description: "math:model=text_code,subject=number_theory,level=4,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=intermediate_algebra,level=4,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=algebra,level=4,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=prealgebra,level=4,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=geometry,level=4,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=counting_and_probability,level=4,use_chain_of_thought=True", priority: 4}
{description: "math:model=text_code,subject=precalculus,level=4,use_chain_of_thought=True", priority: 4}

# Level 5 (priority 3)
{description: "math:model=text_code,subject=number_theory,level=5,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=intermediate_algebra,level=5,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=algebra,level=5,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=prealgebra,level=5,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=geometry,level=5,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=counting_and_probability,level=5,use_chain_of_thought=True", priority: 3}
{description: "math:model=text_code,subject=precalculus,level=5,use_chain_of_thought=True", priority: 3}

# Runs against model=neurips/local, all at priority 1.
# sam_sum additionally sets max_train_instances=3; the other two entries pass
# only the model argument.
{description: "sam_sum:model=neurips/local,max_train_instances=3", priority: 1}
{description: "ethics_utilitarianism:model=neurips/local", priority: 1}
{description: "corr2cause:model=neurips/local", priority: 1}

# Closes the `entries` list.
]

0 comments on commit 8b40dd7

Please sign in to comment.