@@ -58,7 +58,7 @@ accelerate launch --main_process_port 30005 main.py \
5858 --tasks mercury \
5959 --n_samples 5 \
6060 --temperature 0.2 \
61- --batch_size 10 \
61+ --batch_size 1 \
6262 --allow_code_execution \
6363 --save_generations \
6464 --metric_output_path deepseek-coder-6.7b-base-mercury-result.json
@@ -137,7 +137,7 @@ accelerate launch --main_process_port 30011 main.py \
137137 --tasks mercury \
138138 --n_samples 5 \
139139 --temperature 0.2 \
140- --batch_size 5 \
140+ --batch_size 10 \
141141 --allow_code_execution \
142142 --save_generations \
143143 --metric_output_path starcoder2-3b-SFT-mercury-result.json
@@ -228,7 +228,48 @@ accelerate launch --main_process_port 30018 main.py \
228228 --tasks mercury \
229229 --n_samples 5 \
230230 --temperature 0.2 \
231+ --batch_size 5 \
232+ --allow_code_execution \
233+ --save_generations \
234+ --metric_output_path codeLlama-13b-hf-SFT-mercury-result.json
235+
236+ # deepseek-ai/deepseek-coder-33b-base SFT: runs the mercury task on the sft-final_checkpoint (4-bit load, batch size 1, port 30019); metrics go to deepseek-coder-33b-base-SFT-mercury-result.json
237+ accelerate launch --main_process_port 30019 main.py \
238+ --model /home/mingzhe/Projects/Mercury/checkpoints/deepseek-ai/deepseek-coder-33b-base-sft-final_checkpoint \
239+ --load_in_4bit \
240+ --max_length_generation 2048 \
241+ --tasks mercury \
242+ --n_samples 5 \
243+ --temperature 0.2 \
244+ --batch_size 1 \
245+ --allow_code_execution \
246+ --save_generations \
247+ --metric_output_path deepseek-coder-33b-base-SFT-mercury-result.json
248+
249+ # codellama/CodeLlama-34b-hf SFT: runs the mercury task on the sft-final_checkpoint (4-bit load, batch size 1, port 30020); metrics go to codeLlama-34b-hf-SFT-mercury-result.json
250+ accelerate launch --main_process_port 30020 main.py \
251+ --model /home/mingzhe/Projects/Mercury/checkpoints/codellama/CodeLlama-34b-hf-sft-final_checkpoint \
252+ --load_in_4bit \
253+ --max_length_generation 2048 \
254+ --tasks mercury \
255+ --n_samples 5 \
256+ --temperature 0.2 \
257+ --batch_size 1 \
258+ --allow_code_execution \
259+ --save_generations \
260+ --metric_output_path codeLlama-34b-hf-SFT-mercury-result.json
261+
262+
263+
264+ # deepseek-ai/deepseek-coder-6.7b-base DPO: runs the mercury task on the dpo-final_checkpoint (4-bit load, batch size 1, port 30025); metrics go to deepseek-coder-6.7b-base-DPO-mercury-result.json
265+ accelerate launch --main_process_port 30025 main.py \
266+ --model /home/mingzhe/Projects/Mercury/checkpoints/deepseek-ai/deepseek-coder-6.7b-base-dpo-final_checkpoint \
267+ --load_in_4bit \
268+ --max_length_generation 2048 \
269+ --tasks mercury \
270+ --n_samples 5 \
271+ --temperature 0.2 \
231272 --batch_size 1 \
232273 --allow_code_execution \
233274 --save_generations \
234- --metric_output_path codeLlama-13b-hf-SFT -mercury-result.json
275+ --metric_output_path deepseek-coder-6.7b-base-DPO-mercury-result.json
0 commit comments