mirror of
https://github.com/knu-plml/apr-using-qlora.git
synced 2026-05-06 18:45:12 +00:00
14 KiB
14 KiB
Fine-tuning
codegen_6b_v5 (4090)
CUDA_VISIBLE_DEVICES="0" python sg_finetune.py \
--run_name codegen_6b_v5 \
--model_name_or_path ~/WorkspaceLabModels/codegen-6B \
--output_dir ../../nosync/output/codegen_6b_v5 \
--dataset ../../finetune_training.jsonl \
--validation_dataset ../../finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 0 \
--max_length 768 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
incoder_6b_v5 (4090)
CUDA_VISIBLE_DEVICES="1" python sg_finetune.py \
--run_name incoder_6b_v5 \
--model_name_or_path ~/WorkspaceLabModels/incoder-6B \
--output_dir ../../nosync/output/incoder_6b_v5 \
--dataset ../../finetune_training.jsonl \
--validation_dataset ../../finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 0 \
--max_length 1024 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
codellama_7b_v5 (4090)
CUDA_VISIBLE_DEVICES="2" python sg_finetune.py \
--run_name codellama_7b_v5 \
--model_name_or_path ~/WorkspaceLabModels/code_llama-7b-hf \
--output_dir ../../nosync/output/codellama_7b_v5 \
--dataset ../../finetune_training.jsonl \
--validation_dataset ../../finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 0 \
--max_length 1024 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
codellama_13b_v5 (a6000)
CUDA_VISIBLE_DEVICES="0" python sg_finetune.py \
--run_name codellama_13b_v5 \
--model_name_or_path ~/WorkspaceLabModels/code_llama-13b-hf \
--output_dir ../../nosync/output/codellama_13b_v5 \
--dataset ../../finetune_training.jsonl \
--validation_dataset ../../finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 0 \
--max_length 1024 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 2000 \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
codellama_34b_v5 (a6000)
CUDA_VISIBLE_DEVICES="1" python sg_finetune.py \
--run_name codellama_34b_v5 \
--model_name_or_path ~/WorkspaceLabModels/code_llama-34b-hf \
--output_dir ../../nosync/output/codellama_34b_v5 \
--dataset ../../finetune_training.jsonl \
--validation_dataset ../../finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0001 \
--seed 0 \
--max_length 1024 \
--per_device_train_batch_size 4 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 4000 \
--eval_dataset_size 1000 \
--max_eval_samples 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--lora_dropout 0.05 \
--report_to wandb
bf16 seed72
codegen_6b_v7 (4090)
CUDA_VISIBLE_DEVICES="0" python ./src/sg_finetune.py \
--run_name codegen_6b_v7 \
--model_name_or_path ~/WorkspaceLabModels/codegen_6b \
--output_dir ~/WorkspaceLabModels/codegen_6b_v7 \
--dataset ./data/finetune_training.jsonl \
--validation_dataset ./data/finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 72 \
--max_length 768 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--save_steps 1000 \
--specific_save_steps "13,125,1250,6250" \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
incoder_6b_v7 (4090)
CUDA_VISIBLE_DEVICES="1" python ./src/sg_finetune.py \
--run_name incoder_6b_v7 \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v7 \
--dataset ./data/finetune_training.jsonl \
--validation_dataset ./data/finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 72 \
--max_length 1024 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--save_steps 1000 \
--specific_save_steps "13,125,1250,6250" \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
codellama_7b_v7 (4090)
CUDA_VISIBLE_DEVICES="2" python ./src/sg_finetune.py \
--run_name codellama_7b_v7 \
--model_name_or_path ~/WorkspaceLabModels/codellama_7b \
--output_dir ~/WorkspaceLabModels/codellama_7b_v7 \
--dataset ./data/finetune_training.jsonl \
--validation_dataset ./data/finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 72 \
--max_length 1024 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--save_steps 1000 \
--specific_save_steps "13,125,1250,6250" \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
codellama_13b_v7 (A6000)
CUDA_VISIBLE_DEVICES="0" python ./src/sg_finetune.py \
--run_name codellama_13b_v7 \
--model_name_or_path ~/WorkspaceLabModels/codellama_13b \
--output_dir ~/WorkspaceLabModels/codellama_13b_v7 \
--dataset ./data/finetune_training.jsonl \
--validation_dataset ./data/finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0002 \
--seed 72 \
--max_length 1024 \
--per_device_train_batch_size 8 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 1000 \
--save_steps 1000 \
--specific_save_steps "13,125,1250,6250" \
--eval_dataset_size 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--report_to wandb
codellama_34b_v7 (A6000)
CUDA_VISIBLE_DEVICES="1" python ./src/sg_finetune.py \
--run_name codellama_34b_v7 \
--model_name_or_path ~/WorkspaceLabModels/codellama_34b \
--output_dir ~/WorkspaceLabModels/codellama_34b_v7 \
--dataset ./data/finetune_training.jsonl \
--validation_dataset ./data/finetune_validation.jsonl \
--do_train \
--do_eval \
--learning_rate 0.0001 \
--seed 72 \
--max_length 1024 \
--per_device_train_batch_size 4 \
--gradient_checkpointing \
--gradient_accumulation_steps 1 \
--num_train_epochs 1 \
--eval_steps 2000 \
--save_steps 2000 \
--specific_save_steps "25,250,2500,12500" \
--eval_dataset_size 1000 \
--max_eval_samples 1000 \
--per_device_eval_batch_size 1 \
--logging_steps 10 \
--lora_dropout 0.05 \
--report_to wandb
Benchmarks
# --do_humaneval
# --do_quixbugs
# --do_defects4j --strict_defects4j
# --do_generate
# --do_validate
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codegen_6b \
--output_dir ~/WorkspaceLabModels/codegen_6b_v7 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 64 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="1" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v7 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="2" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_7b \
--output_dir ~/WorkspaceLabModels/codellama_7b_v7 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="1" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_13b \
--output_dir ~/WorkspaceLabModels/codellama_13b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--strict_defects4j \
--do_validate
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_34b \
--output_dir ~/WorkspaceLabModels/codellama_34b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--strict_defects4j \
--do_validate
# do_defects4j 추가
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_7b \
--output_dir ~/WorkspaceLabModels/codellama_7b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_7b \
--output_dir ~/WorkspaceLabModels/codellama_7b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--do_validate
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codegen_6b \
--output_dir ~/WorkspaceLabModels/codegen_6b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--do_generate \
--do_validate
# codellama_13b_v5 집중 테스트
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_13b \
--output_dir ~/WorkspaceLabModels/codellama_13b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="1" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_13b \
--output_dir ~/WorkspaceLabModels/codellama_13b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_quixbugs \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_13b \
--output_dir ~/WorkspaceLabModels/codellama_13b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--do_generate \
--do_validate
# codellama_34b_v5 집중 테스트
CUDA_VISIBLE_DEVICES="0" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_34b \
--output_dir ~/WorkspaceLabModels/codellama_34b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="1" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_34b \
--output_dir ~/WorkspaceLabModels/codellama_34b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_quixbugs \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="1" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/codellama_34b \
--output_dir ~/WorkspaceLabModels/codellama_34b_v5 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_defects4j \
--do_generate \
--do_validate
# incoder_6b_v5 humaneval 스탭별 테스트
CUDA_VISIBLE_DEVICES="1" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v5/checkpoint-1000 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="3" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v5/checkpoint-2000 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="2" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v5/checkpoint-4000 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="3" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v5/checkpoint-8000 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
CUDA_VISIBLE_DEVICES="2" python src/sg_bench.py \
--model_name_or_path ~/WorkspaceLabModels/incoder_6b \
--output_dir ~/WorkspaceLabModels/incoder_6b_v5/checkpoint-12000 \
--do_sample \
--seed 0 \
--num_beams 10 \
--max_new_tokens 128 \
--do_humaneval \
--do_generate \
--do_validate
DEBUG QuixBugs
javac -cp .:java_programs:junit4-4.12.jar:hamcrest-all-1.3.jar java_testcases/junit/GCD_TEST.java
java -cp .:java_programs:junit4-4.12.jar:hamcrest-all-1.3.jar org.junit.runner.JUnitCore java_testcases.junit.GCD_TEST
DEBUG defects4j
defects4j checkout -p Chart -v 4b -w /home/yglee/wl/p14/nosync/defects4j_tmp853/tmp