From d01ea9ddbc8942c6b516790b92a0046d37764c7a Mon Sep 17 00:00:00 2001 From: SolshineCode <143902425+SolshineCode@users.noreply.github.com> Date: Mon, 21 Oct 2024 02:22:31 -0700 Subject: [PATCH] Part 1 of qwen 2 compatibility: elif model_type qwen2 Line 27 adds an option for the qwen2 architecture to be recognized: elif data['model_type'] == "qwen2": data['model_type'] = "mergedqwen2" data['architectures'][0] = 'MergedQwen2ForCausalLM ' This is part 1 of qwen 2 compatibility. --- dam/merge.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/dam/merge.py b/dam/merge.py index e972b33..639a38a 100644 --- a/dam/merge.py +++ b/dam/merge.py @@ -24,6 +24,9 @@ def fix_config(save_path, num_models, non_linearity, merge_embedding_layers, mer elif data['model_type'] == "llama": data['model_type'] = "mergedllama" data['architectures'][0] = 'MergedLlamaForCausalLM' + elif data['model_type'] == "qwen2": + data['model_type'] = "mergedqwen2" + data['architectures'][0] = 'MergedQwen2ForCausalLM ' data['num_merged_models'] = num_models data['non_linearity'] = non_linearity