From 29872387aac35961690394aea8ca04bc04dc35e3 Mon Sep 17 00:00:00 2001 From: Mingyu Cao <1054527636@qq.com> Date: Fri, 13 Dec 2024 17:31:58 +0800 Subject: [PATCH] fix --- tmp_files/modeling_deepseek_block_trim.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tmp_files/modeling_deepseek_block_trim.py b/tmp_files/modeling_deepseek_block_trim.py index 19d61a46c6..6f03f4fd9e 100644 --- a/tmp_files/modeling_deepseek_block_trim.py +++ b/tmp_files/modeling_deepseek_block_trim.py @@ -442,7 +442,7 @@ def backward(ctx, grad_output): # 层索引 to 专家索引序列 # current_dir = "/root/autodl-tmp/deepseek-ai/deepseek-moe-16b-base" -current_dir = '/mnt/fast/nobackup/users/ly0008/caomingyu/transformers/deepseek_model' +current_dir = '/home/work/mt_cmy/programs/CD-MoE/cd-moe/data' expert_order_path = os.path.join( current_dir, "layer_idx_to_expert_idx.greedy_jl.json") layer_idx_to_expert_idxs = json.load(open(expert_order_path, 'r'))