Folder where you want to save samples/evaluations:
# Template placeholder: replace "SET ME!" with a real directory path before
# running this line. The value is unquoted and contains a space, so it is not
# usable as written. $SAVE_DIR is the parent directory referenced by the
# save_dir=/samples_dir= arguments of the commands further down.
export SAVE_DIR=SET ME!
Folder where you want to save temporary files for the MiniF2F-MATH evaluation; the commands below also create its cache directory structure:
# Template placeholder: replace "SET ME!" with a real directory path before
# running this line. The value is unquoted and contains a space, so it is not
# usable as written. $SCRATCH_DIR is the parent of the cache/ and lean_tmp/
# directories created right after this line.
export SCRATCH_DIR=SET ME!
# Create the scratch tree: $SCRATCH_DIR/cache and $SCRATCH_DIR/lean_tmp (these
# are the paths later handed to the MiniF2F commands as CACHE_DIR and TMP_DIR).
# `-p` also creates $SCRATCH_DIR itself and makes the command safe to re-run
# when the directories already exist. The `:?` guard aborts the command when
# SCRATCH_DIR is unset or empty instead of trying to create /cache and
# /lean_tmp at the filesystem root.
mkdir -p -- \
  "${SCRATCH_DIR:?SCRATCH_DIR must be set}/cache" \
  "${SCRATCH_DIR:?SCRATCH_DIR must be set}/lean_tmp"
# Concrete values for the two directories. These assignments replace whatever
# SAVE_DIR / SCRATCH_DIR were set to earlier in the session.
# NOTE(review): these look like machine-specific paths — substitute your own.
# One `export` per line: when both were on a single line, the second `export`
# word was parsed as a variable name and a stray variable called `export` was
# marked for export.
export SAVE_DIR=/matx/u/bcabrown/test_monkeys2
export SCRATCH_DIR=/scr/bcabrown/lean_scratch
# Generate samples with meta-llama/Meta-Llama-3-8B-Instruct, one command per
# benchmark script (gsm8k, MATH, code_contests, minif2f). Each command passes
# save_dir=$SAVE_DIR/<name>_samples; the expansion is quoted so a SAVE_DIR
# containing spaces or glob characters is still passed as a single argument.
# NOTE(review): `--list NAME ... list--` looks like the CLI's way of delimiting
# a list-valued option — confirm against the scripts' argument parser.

# GSM8K
python llmonk/generate/gsm8k.py \
  model=meta-llama/Meta-Llama-3-8B-Instruct \
  save_dir="$SAVE_DIR/gsm8k_samples" \
  --list vllm_args --disable-log-requests list-- \
  --list stop_strings Q: Question: list--

# MATH
python llmonk/generate/MATH.py \
  model=meta-llama/Meta-Llama-3-8B-Instruct \
  save_dir="$SAVE_DIR/math_samples" \
  --list vllm_args --disable-log-requests list-- \
  --list stop_strings Problem: list--

# CodeContests
python llmonk/generate/code_contests.py \
  model=meta-llama/Meta-Llama-3-8B-Instruct \
  save_dir="$SAVE_DIR/cc_samples" \
  --list vllm_args --disable-log-requests list-- \
  --list stop_strings Q: Question: list--

# MiniF2F (the stop string contains spaces, hence the single quotes)
python llmonk/generate/minif2f.py \
  model=meta-llama/Meta-Llama-3-8B-Instruct \
  save_dir="$SAVE_DIR/minif2f_samples" \
  --list vllm_args --disable-log-requests list-- \
  --list stop_strings 'Write a lean4' list--
# Evaluate the generated samples. Each command reads
# samples_dir=$SAVE_DIR/<name>_samples and passes save_dir=$SAVE_DIR/<name>_eval.
# Every dataset gets its own <name>_eval directory, so the gsm8k and MATH
# evaluations (both run through math_datasets.py) do not share one output
# directory. Expansions are quoted so paths containing spaces stay single
# arguments.

# GSM8K
python llmonk/evaluate/math_datasets.py \
  samples_dir="$SAVE_DIR/gsm8k_samples" \
  save_dir="$SAVE_DIR/gsm8k_eval" \
  dset=gsm8k

# MATH
python llmonk/evaluate/math_datasets.py \
  samples_dir="$SAVE_DIR/math_samples" \
  save_dir="$SAVE_DIR/math_eval" \
  dset=math

# CodeContests
python llmonk/evaluate/code_contests.py \
  samples_dir="$SAVE_DIR/cc_samples" \
  save_dir="$SAVE_DIR/cc_eval"

# MiniF2F: CONTAINER, CACHE_DIR and TMP_DIR are set in the environment of this
# one command only, pointing at the cache/ and lean_tmp/ dirs under SCRATCH_DIR.
CONTAINER=native \
CACHE_DIR="$SCRATCH_DIR/cache" \
TMP_DIR="$SCRATCH_DIR/lean_tmp" \
  python llmonk/evaluate/minif2f.py \
  samples_dir="$SAVE_DIR/minif2f_samples" \
  save_dir="$SAVE_DIR/minif2f_eval"
# Run the two test scripts under llmonk/tests.

# CodeContests test script: takes no arguments or extra environment.
python llmonk/tests/code_contests.py

# MiniF2F test script: CONTAINER, CACHE_DIR and TMP_DIR are set in the
# environment of this one command only.
CONTAINER=native \
CACHE_DIR="${SCRATCH_DIR}/cache" \
TMP_DIR="${SCRATCH_DIR}/lean_tmp" \
  python llmonk/tests/minif2f.py