From a529b4d912240f089be65d27cc5746ff6259636f Mon Sep 17 00:00:00 2001
From: Vineeth <48151992+Dornavineeth@users.noreply.github.com>
Date: Wed, 30 Jul 2025 09:21:08 -0700
Subject: [PATCH] Added qwen support (#24)

---
Notes (this section sits between the "---" separator and the first diff
header, so it is commentary only and not part of any file content):

  * Adds one model config per Qwen2.5 Instruct size (1.5B, 3B, 7B). The
    three files are identical except for the checkpoint id used in
    model_args.pretrained_model_name_or_path and
    tokenizer_args.pretrained_model_name_or_path.
  * model_args selects the flash_attention_2 attention implementation and
    the bfloat16 torch dtype for every size.
  * template_args carries the system prompt in two forms (plain text, and
    wrapped in <|im_start|>system ... <|im_end|>) plus the start/end tags
    that wrap user and assistant turns.
  * Review fix: Qwen2.5-3B-Instruct.yaml previously ended without a
    trailing newline ("\ No newline at end of file"), unlike its two
    siblings. The marker is dropped so that all three files end with
    exactly one newline. The blob id on that file's index line (0f903fe)
    was recorded before this edit and may no longer match the result.

 configs/model/Qwen2.5-1.5B-Instruct.yaml | 14 ++++++++++++++
 configs/model/Qwen2.5-3B-Instruct.yaml   | 14 ++++++++++++++
 configs/model/Qwen2.5-7B-Instruct.yaml   | 14 ++++++++++++++
 3 files changed, 42 insertions(+)
 create mode 100644 configs/model/Qwen2.5-1.5B-Instruct.yaml
 create mode 100644 configs/model/Qwen2.5-3B-Instruct.yaml
 create mode 100644 configs/model/Qwen2.5-7B-Instruct.yaml

diff --git a/configs/model/Qwen2.5-1.5B-Instruct.yaml b/configs/model/Qwen2.5-1.5B-Instruct.yaml
new file mode 100644
index 0000000..803fe1d
--- /dev/null
+++ b/configs/model/Qwen2.5-1.5B-Instruct.yaml
@@ -0,0 +1,14 @@
+model_args:
+  pretrained_model_name_or_path: "Qwen/Qwen2.5-1.5B-Instruct"
+  attn_implementation: 'flash_attention_2'
+  torch_dtype: bfloat16
+tokenizer_args:
+  pretrained_model_name_or_path: "Qwen/Qwen2.5-1.5B-Instruct"
+template_args:
+  apply_chat_template: true
+  system_prompt: "You are a helpful assistant."
+  system_prompt_with_special_tokens: "<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n"
+  user_start_tag: "<|im_start|>user\n"
+  user_end_tag: "<|im_end|>\n"
+  asst_start_tag: "<|im_start|>assistant\n"
+  asst_end_tag: "<|im_end|>\n"
diff --git a/configs/model/Qwen2.5-3B-Instruct.yaml b/configs/model/Qwen2.5-3B-Instruct.yaml
new file mode 100644
index 0000000..0f903fe
--- /dev/null
+++ b/configs/model/Qwen2.5-3B-Instruct.yaml
@@ -0,0 +1,14 @@
+model_args:
+  pretrained_model_name_or_path: "Qwen/Qwen2.5-3B-Instruct"
+  attn_implementation: 'flash_attention_2'
+  torch_dtype: bfloat16
+tokenizer_args:
+  pretrained_model_name_or_path: "Qwen/Qwen2.5-3B-Instruct"
+template_args:
+  apply_chat_template: true
+  system_prompt: "You are a helpful assistant."
+  system_prompt_with_special_tokens: "<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n"
+  user_start_tag: "<|im_start|>user\n"
+  user_end_tag: "<|im_end|>\n"
+  asst_start_tag: "<|im_start|>assistant\n"
+  asst_end_tag: "<|im_end|>\n"
diff --git a/configs/model/Qwen2.5-7B-Instruct.yaml b/configs/model/Qwen2.5-7B-Instruct.yaml
new file mode 100644
index 0000000..c9b292f
--- /dev/null
+++ b/configs/model/Qwen2.5-7B-Instruct.yaml
@@ -0,0 +1,14 @@
+model_args:
+  pretrained_model_name_or_path: "Qwen/Qwen2.5-7B-Instruct"
+  attn_implementation: 'flash_attention_2'
+  torch_dtype: bfloat16
+tokenizer_args:
+  pretrained_model_name_or_path: "Qwen/Qwen2.5-7B-Instruct"
+template_args:
+  apply_chat_template: true
+  system_prompt: "You are a helpful assistant."
+  system_prompt_with_special_tokens: "<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n"
+  user_start_tag: "<|im_start|>user\n"
+  user_end_tag: "<|im_end|>\n"
+  asst_start_tag: "<|im_start|>assistant\n"
+  asst_end_tag: "<|im_end|>\n"