OptimalScale · research4pan · Apr 24, 2024 · Apr 23, 2024 · Apr 23, 2024 · Apr 23, 2024
diff --git a/scripts/run_finetune_with_lora.sh b/scripts/run_finetune_with_lora.sh
@@ -3,7 +3,8 @@
 
 # Parses arguments
 model_name_or_path=gpt2
-dataset_path=data/alpaca/train
+dataset_path=data/alpaca/train_conversation
+conversation_template=llama2
 output_dir=output_models/finetune
 deepspeed_args="--master_port=11000"
 
@@ -18,6 +19,10 @@ while [[ $# -ge 1 ]]; do
       dataset_path="$2"
       shift
       ;;
+    --conversation_template)
+      conversation_template="$2"
+      shift
+      ;;
     -o|--output_lora_path)
       output_dir="$2"
       shift
@@ -43,6 +48,7 @@ deepspeed ${deepspeed_args} \
   examples/finetune.py \
     --model_name_or_path ${model_name_or_path} \
     --dataset_path ${dataset_path} \
+    --conversation_template "${conversation_template}" \
     --output_dir ${output_dir} --overwrite_output_dir \
     --num_train_epochs 0.01 \
     --learning_rate 1e-4 \

diff --git a/scripts/run_finetune_with_lora_save_aggregated_weights.sh b/scripts/run_finetune_with_lora_save_aggregated_weights.sh
@@ -3,7 +3,8 @@
 
 # Parses arguments
 model_name_or_path=gpt2
-dataset_path=data/alpaca/train
+dataset_path=data/alpaca/train_conversation
+conversation_template=llama2
 output_dir=output_models/finetune
 deepspeed_args="--master_port=11000"
 
@@ -18,6 +19,10 @@ while [[ $# -ge 1 ]]; do
       dataset_path="$2"
       shift
       ;;
+    --conversation_template)
+      conversation_template="$2"
+      shift
+      ;;
     -o|--output_model_path)
       output_dir="$2"
       shift
@@ -43,6 +48,7 @@ deepspeed ${deepspeed_args} \
   examples/finetune.py \
     --model_name_or_path ${model_name_or_path} \
     --dataset_path ${dataset_path} \
+    --conversation_template "${conversation_template}" \
     --output_dir ${output_dir} --overwrite_output_dir \
     --num_train_epochs 0.01 \
     --learning_rate 1e-4 \

diff --git a/scripts/run_finetune_with_qlora_save_aggregated_weights.sh b/scripts/run_finetune_with_qlora_save_aggregated_weights.sh
@@ -3,7 +3,8 @@
 
 # Parses arguments
 model_name_or_path=meta-llama/Llama-2-13b-hf
-dataset_path=/home/paperspace/LMFlow/alpaca/train
+dataset_path=data/alpaca/train_conversation
+conversation_template=llama2
 output_dir=output_models/finetune
 deepspeed_args="--master_port=11000"
 
@@ -18,6 +19,10 @@ while [[ $# -ge 1 ]]; do
       dataset_path="$2"
       shift
       ;;
+    --conversation_template)
+      conversation_template="$2"
+      shift
+      ;;
     -o|--output_model_path)
       output_dir="$2"
       shift
@@ -43,6 +48,7 @@ deepspeed ${deepspeed_args} \
   examples/finetune.py \
     --model_name_or_path ${model_name_or_path} \
     --dataset_path ${dataset_path} \
+    --conversation_template "${conversation_template}" \
     --output_dir ${output_dir} --overwrite_output_dir \
     --num_train_epochs 0.01 \
     --learning_rate 1e-4 \

diff --git a/src/lmflow/models/hf_decoder_model.py b/src/lmflow/models/hf_decoder_model.py
@@ -631,6 +631,7 @@ def tokenize_function(examples):
                 (
                     fingerprint
                     + str(self.tokenizer)
+                    + (str(conversation_template) if dataset_type == "conversation" else "")  # parenthesized: a bare conditional would absorb every other term of the sum
                     + f'###disable_group_texts={data_args.disable_group_texts}'
                     + f'###block_size={data_args.block_size}'
                 ).encode("utf-8")
@@ -818,7 +819,7 @@ def get_peft_without_qlora(self):
                 torch_dtype=torch_dtype,
                 device_map=device_map,
                 trust_remote_code = self.model_args.trust_remote_code,
-                attn_implementation="flash_attention_2" if model_args.use_flash_attention else None,
+                attn_implementation="flash_attention_2" if self.model_args.use_flash_attention else None,
             )
 
             self.backend_model = PeftModel.from_pretrained(self.backend_model_full, tmpdirname)