Text Generation
Transformers
Safetensors
English
ddllama
conversational
custom_code
xuan-luo committed on
Commit
793dca0
·
verified ·
1 Parent(s): 2cff985

Update evals/evals.sh

Browse files
Files changed (1) hide show
  1. evals/evals.sh +6 -6
evals/evals.sh CHANGED
@@ -1,6 +1,6 @@
1
- CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --main_process_port 29500 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks mmlu --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 4 > 1-mmlu.out 2>&1
2
- CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --main_process_port 29500 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks hellaswag --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 4 > 2-hellaswag.out 2>&1
3
- CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --main_process_port 29500 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks winogrande --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 8 > 3-winogrande.out 2>&1
4
- CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --main_process_port 29500 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks gsm8k --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 4 > 4-gsm8k.out 2>&1
5
- CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --main_process_port 29500 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks humaneval --batch_size 4 --confirm_run_unsafe_code > 5-humaneval.out 2>&1
6
- CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --main_process_port 29500 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks coqa --batch_size 4 > 6-coqa.out 2>&1
 
1
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks mmlu --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 16 > 1-mmlu.out 2>&1
2
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks hellaswag --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 16 > 2-hellaswag.out 2>&1
3
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks winogrande --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 16 > 3-winogrande.out 2>&1
4
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks gsm8k --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 16 > 4-gsm8k-ori.out 2>&1
5
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks humaneval --batch_size 16 --confirm_run_unsafe_code > 5-humaneval.out 2>&1
6
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks coqa --batch_size 16 > 6-coqa.out 2>&1