diff --git a/scripts/gpt_oss_20b_post/inc_output_hooks_maxabs_0_1.json b/scripts/gpt_oss_20b_post/inc_output_hooks_maxabs_0_1.json new file mode 100755 index 000000000000..651a93aaf805 --- /dev/null +++ b/scripts/gpt_oss_20b_post/inc_output_hooks_maxabs_0_1.json @@ -0,0 +1,32023 @@ +{ + "GlobalRank": null, + "LocalRank": 0, + "Mode": "DynamicRange", + "Nodes": { + "model.layers.0.attn.qkv": { + "inputs": [ + [ + [ + 40.75 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.0.attn.o_proj": { + "inputs": [ + [ + [ + 11.0625 + ] + ] + ], + "outputs": [ + [ + [ + 68.0 + ] + ], + [ + [ + 2.3235528441943354e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 3.15625 + ] + ] + } + }, + "model.layers.0.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 2.203125 + ] + ], + [ + [ + 95.5 + ] + ] + ] + }, + "model.layers.0.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 11.0625 + ] + ] + ] + }, + "model.layers.0.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 2.203125 + ] + ] + ] + }, + "model.layers.0.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 9.75 + ] + ] + ] + }, + "model.layers.0.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 95.5 + ] + ] + ] + }, + "model.layers.0.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 11.0625 + ] + ] + ] + }, + "model.layers.0.mlp.router": { + "inputs": [ + [ + [ + 9.1875 + ] + ] + ], + "params": { + "weight": [ + [ + 0.2353515625 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 9.1875 + ] + ] + ], + "outputs": [ + [ + [ + 230.0 + ] + ], + [ + [ + 52.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 53.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 55.75 + ] + ], + [ + [ + 38.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ] + ] + }, + "model.layers.0.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.0.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.1.attn.qkv": { + "inputs": [ + [ + [ + 36.5 + ] + ] + ], + "params": { + "weight": [ + [ + 2.71875 + ] + ] + } + }, + "model.layers.1.attn.o_proj": { + "inputs": [ + [ + [ + 9.875 + ] + ] + ], + "outputs": [ + [ + [ + 82.0 + ] + ], + [ + [ + 2.3884565549260207e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 4.5 + ] + ] + } + }, + "model.layers.1.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 2.515625 + ] + ], + [ + [ + 166.0 + ] + ] + ] + }, + "model.layers.1.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 10.0 + ] + ] + ] + }, + "model.layers.1.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 2.515625 + ] + ] + ] + }, + "model.layers.1.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 6.03125 + ] + ] + ] + }, + "model.layers.1.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 166.0 + ] + ] + ] + }, + "model.layers.1.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 10.0 + ] + ] + ] + }, + "model.layers.1.mlp.router": { + "inputs": [ + [ + [ + 6.0625 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1455078125 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 6.0625 + ] + ] + ], + "outputs": [ + [ + [ + 229.0 + ] + ], + [ + [ + 39.25 + ] + ], + [ + [ + 49.75 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 52.5 + ] + ], + [ + [ + 55.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 46.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 53.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 54.25 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 50.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 54.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ] + ] + }, + "model.layers.1.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.1.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.2.attn.qkv": { + "inputs": [ + [ + [ + 37.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.84375 + ] + ] + } + }, + "model.layers.2.attn.o_proj": { + "inputs": [ + [ + [ + 14.125 + ] + ] + ], + "outputs": [ + [ + [ + 84.0 + ] + ], + [ + [ + 2.679225179003971e+36 + ] + ] + ], + "params": { + "weight": [ + [ + 12.625 + ] + ] + } + }, + "model.layers.2.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 2.515625 + ] + ], + [ + [ + 45.25 + ] + ] + ] + }, + "model.layers.2.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 14.125 + ] + ] + ] + }, + "model.layers.2.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 2.515625 + ] + ] + ] + }, + "model.layers.2.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 8.5 + ] + ] + ] + }, + "model.layers.2.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 45.25 + ] + ] + ] + }, + "model.layers.2.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 14.125 + ] + ] + ] + }, + "model.layers.2.mlp.router": { + "inputs": [ + [ + [ + 7.125 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1572265625 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 7.125 + ] + ] + ], + "outputs": [ + [ + [ + 217.0 + ] + ], + [ + [ + 42.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 47.5 + ] + ], + [ + [ + 35.5 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 43.25 + ] + ], + [ + [ + 47.5 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 54.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 48.5 + ] + ], + [ + [ + 50.5 + ] + ], + [ + [ + 35.75 + ] + ], + [ + [ + 55.25 + ] + ], + [ + [ + 52.5 + ] + ], + [ + [ + 55.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.0 + ] + ], + [ + [ + 49.5 + ] + ], + [ + [ + 33.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 54.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 46.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 54.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 55.25 + ] + ] + ] + }, + "model.layers.2.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.2.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.3.attn.qkv": { + "inputs": [ + [ + [ + 76.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.484375 + ] + ] + } + }, + "model.layers.3.attn.o_proj": { + "inputs": [ + [ + [ + 8.8125 + ] + ] + ], + "outputs": [ + [ + [ + 108.0 + ] + ], + [ + [ + 1.3159357158270667e+38 + ] + ] + ], + "params": { + "weight": [ + [ + 14.25 + ] + ] + } + }, + "model.layers.3.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 2.21875 + ] + ], + [ + [ + 124.0 + ] + ] + ] + }, + "model.layers.3.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 16.25 + ] + ] + ] + }, + "model.layers.3.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 2.21875 + ] + ] + ] + }, + "model.layers.3.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 5.59375 + ] + ] + ] + }, + "model.layers.3.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 124.0 + ] + ] + ] + }, + "model.layers.3.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 16.25 + ] + ] + ] + }, + "model.layers.3.mlp.router": { + "inputs": [ + [ + [ + 8.8125 + ] + ] + ], + "params": { + "weight": [ + [ + 0.126953125 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 8.8125 + ] + ] + ], + "outputs": [ + [ + [ + 188.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 53.0 + ] + ], + [ + [ + 31.875 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 50.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 36.25 + ] + ], + [ + [ + 44.75 + ] + ], + [ + [ + 43.5 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 53.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 51.0 + ] + ], + [ + [ + 53.0 + ] + ], + [ + [ + 53.75 + ] + ], + [ + [ + 44.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 42.5 + ] + ], + [ + [ + 55.0 + ] + ] + ] + }, + "model.layers.3.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.3.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.attn.qkv": { + "inputs": [ + [ + [ + 51.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.109375 + ] + ] + } + }, + "model.layers.4.attn.o_proj": { + "inputs": [ + [ + [ + 21.0 + ] + ] + ], + "outputs": [ + [ + [ + 96.0 + ] + ], + [ + [ + 2.3105721020479983e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 6.8125 + ] + ] + } + }, + "model.layers.4.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 2.984375 + ] + ], + [ + [ + 147.0 + ] + ] + ] + }, + "model.layers.4.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 23.5 + ] + ] + ] + }, + "model.layers.4.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 2.984375 + ] + ] + ] + }, + "model.layers.4.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 17.125 + ] + ] + ] + }, + "model.layers.4.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 148.0 + ] + ] + ] + }, + "model.layers.4.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 23.5 + ] + ] + ] + }, + "model.layers.4.mlp.router": { + "inputs": [ + [ + [ + 10.375 + ] + ] + ], + "params": { + "weight": [ + [ + 0.158203125 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 10.375 + ] + ] + ], + "outputs": [ + [ + [ + 205.0 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 47.0 + ] + ], + [ + [ + 41.25 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 49.0 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 37.25 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 51.0 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 45.75 + ] + ], + [ + [ + 55.5 + ] + ], + [ + [ + 42.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 43.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 50.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 52.0 + ] + ], + [ + [ + 49.75 + ] + ], + [ + [ + 42.5 + ] + ], + [ + [ + 53.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 36.75 + ] + ], + [ + [ + 53.0 + ] + ] + ] + }, + "model.layers.4.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.4.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.attn.qkv": { + "inputs": [ + [ + [ + 44.5 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0859375 + ] + ] + } + }, + "model.layers.5.attn.o_proj": { + "inputs": [ + [ + [ + 11.1875 + ] + ] + ], + "outputs": [ + [ + [ + 130.0 + ] + ], + [ + [ + 708669603840.0 + ] + ] + ], + "params": { + "weight": [ + [ + 17.875 + ] + ] + } + }, + "model.layers.5.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 4.28125 + ] + ], + [ + [ + 70.5 + ] + ] + ] + }, + "model.layers.5.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 14.25 + ] + ] + ] + }, + "model.layers.5.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 4.28125 + ] + ] + ] + }, + "model.layers.5.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 8.3125 + ] + ] + ] + }, + "model.layers.5.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 70.5 + ] + ] + ] + }, + "model.layers.5.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 14.25 + ] + ] + ] + }, + "model.layers.5.mlp.router": { + "inputs": [ + [ + [ + 9.375 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1455078125 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 9.375 + ] + ] + ], + "outputs": [ + [ + [ + 310.0 + ] + ], + [ + [ + 30.125 + ] + ], + [ + [ + 46.5 + ] + ], + [ + [ + 34.0 + ] + ], + [ + [ + 55.75 + ] + ], + [ + [ + 48.25 + ] + ], + [ + [ + 47.75 + ] + ], + [ + [ + 44.75 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 24.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 48.5 + ] + ], + [ + [ + 50.5 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 34.0 + ] + ], + [ + [ + 52.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 41.25 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 41.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 44.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.25 + ] + ] + ] + }, + "model.layers.5.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 16.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.5.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.6.attn.qkv": { + "inputs": [ + [ + [ + 48.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.03125 + ] + ] + } + }, + "model.layers.6.attn.o_proj": { + "inputs": [ + [ + [ + 11.8125 + ] + ] + ], + "outputs": [ + [ + [ + 158.0 + ] + ], + [ + [ + 2.1288417119992793e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 5.34375 + ] + ] + } + }, + "model.layers.6.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 5.0 + ] + ], + [ + [ + 55.5 + ] + ] + ] + }, + "model.layers.6.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 12.5 + ] + ] + ] + }, + "model.layers.6.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 5.0 + ] + ] + ] + }, + "model.layers.6.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 10.5 + ] + ] + ] + }, + "model.layers.6.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 55.5 + ] + ] + ] + }, + "model.layers.6.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 12.5 + ] + ] + ] + }, + "model.layers.6.mlp.router": { + "inputs": [ + [ + [ + 23.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 23.5 + ] + ] + ], + "outputs": [ + [ + [ + 42240.0 + ] + ], + [ + [ + 50.5 + ] + ], + [ + [ + 40.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 30.25 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.25 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 53.25 + ] + ], + [ + [ + 31.625 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 40.5 + ] + ], + [ + [ + 42.75 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 44.75 + ] + ], + [ + [ + 29.875 + ] + ], + [ + [ + 43.5 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 24.375 + ] + ], + [ + [ + 30.5 + ] + ], + [ + [ + 49.25 + ] + ], + [ + [ + 39.25 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 38.25 + ] + ], + [ + [ + 53.0 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 44.25 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 37.75 + ] + ] + ] + }, + "model.layers.6.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.6.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.attn.qkv": { + "inputs": [ + [ + [ + 195.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.75 + ] + ] + } + }, + "model.layers.7.attn.o_proj": { + "inputs": [ + [ + [ + 11.375 + ] + ] + ], + "outputs": [ + [ + [ + 217.0 + ] + ], + [ + [ + 1683627180032.0 + ] + ] + ], + "params": { + "weight": [ + [ + 13.0 + ] + ] + } + }, + "model.layers.7.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 2.34375 + ] + ], + [ + [ + 195.0 + ] + ] + ] + }, + "model.layers.7.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 17.125 + ] + ] + ] + }, + "model.layers.7.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 2.34375 + ] + ] + ] + }, + "model.layers.7.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 10.625 + ] + ] + ] + }, + "model.layers.7.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 195.0 + ] + ] + ] + }, + "model.layers.7.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 17.125 + ] + ] + ] + }, + "model.layers.7.mlp.router": { + "inputs": [ + [ + [ + 77.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.16796875 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 77.0 + ] + ] + ], + "outputs": [ + [ + [ + 400.0 + ] + ], + [ + [ + 24.5 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 48.5 + ] + ], + [ + [ + 43.25 + ] + ], + [ + [ + 25.0 + ] + ], + [ + [ + 54.0 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 44.25 + ] + ], + [ + [ + 45.25 + ] + ], + [ + [ + 24.25 + ] + ], + [ + [ + 27.75 + ] + ], + [ + [ + 43.5 + ] + ], + [ + [ + 27.625 + ] + ], + [ + [ + 39.25 + ] + ], + [ + [ + 36.75 + ] + ], + [ + [ + 31.0 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 35.5 + ] + ], + [ + [ + 49.25 + ] + ], + [ + [ + 26.875 + ] + ], + [ + [ + 40.5 + ] + ], + [ + [ + 50.25 + ] + ], + [ + [ + 26.625 + ] + ], + [ + [ + 30.75 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 30.75 + ] + ], + [ + [ + 32.0 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 35.0 + ] + ], + [ + [ + 22.875 + ] + ] + ] + }, + "model.layers.7.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.7.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.8.attn.qkv": { + "inputs": [ + [ + [ + 121.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.69921875 + ] + ] + } + }, + "model.layers.8.attn.o_proj": { + "inputs": [ + [ + [ + 14.9375 + ] + ] + ], + "outputs": [ + [ + [ + 222.0 + ] + ], + [ + [ + 2.3754758127796836e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 5.65625 + ] + ] + } + }, + "model.layers.8.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.03125 + ] + ], + [ + [ + 49.5 + ] + ] + ] + }, + "model.layers.8.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 15.0 + ] + ] + ] + }, + "model.layers.8.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.03125 + ] + ] + ] + }, + "model.layers.8.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 13.375 + ] + ] + ] + }, + "model.layers.8.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 49.5 + ] + ] + ] + }, + "model.layers.8.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 15.0 + ] + ] + ] + }, + "model.layers.8.mlp.router": { + "inputs": [ + [ + [ + 57.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.177734375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 57.0 + ] + ] + ], + "outputs": [ + [ + [ + 620.0 + ] + ], + [ + [ + 30.625 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 23.375 + ] + ], + [ + [ + 16.625 + ] + ], + [ + [ + 43.0 + ] + ], + [ + [ + 39.25 + ] + ], + [ + [ + 40.75 + ] + ], + [ + [ + 26.25 + ] + ], + [ + [ + 37.5 + ] + ], + [ + [ + 50.75 + ] + ], + [ + [ + 31.5 + ] + ], + [ + [ + 29.875 + ] + ], + [ + [ + 43.0 + ] + ], + [ + [ + 25.625 + ] + ], + [ + [ + 23.25 + ] + ], + [ + [ + 31.125 + ] + ], + [ + [ + 27.875 + ] + ], + [ + [ + 23.125 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 24.625 + ] + ], + [ + [ + 25.0 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 24.5 + ] + ], + [ + [ + 34.75 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 46.75 + ] + ], + [ + [ + 26.75 + ] + ], + [ + [ + 22.625 + ] + ], + [ + [ + 27.25 + ] + ], + [ + [ + 25.125 + ] + ] + ] + }, + "model.layers.8.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 48.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.8.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.attn.qkv": { + "inputs": [ + [ + [ + 207.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0625 + ] + ] + } + }, + "model.layers.9.attn.o_proj": { + "inputs": [ + [ + [ + 12.0625 + ] + ] + ], + "outputs": [ + [ + [ + 820.0 + ] + ], + [ + [ + 5.399988732876221e+36 + ] + ] + ], + "params": { + "weight": [ + [ + 53.75 + ] + ] + } + }, + "model.layers.9.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.640625 + ] + ], + [ + [ + 89.0 + ] + ] + ] + }, + "model.layers.9.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 27.75 + ] + ] + ] + }, + "model.layers.9.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.640625 + ] + ] + ] + }, + "model.layers.9.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 11.625 + ] + ] + ] + }, + "model.layers.9.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 89.0 + ] + ] + ] + }, + "model.layers.9.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 27.75 + ] + ] + ] + }, + "model.layers.9.mlp.router": { + "inputs": [ + [ + [ + 64.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1689453125 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 64.5 + ] + ] + ], + "outputs": [ + [ + [ + 1224.0 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 52.0 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 25.375 + ] + ], + [ + [ + 55.5 + ] + ], + [ + [ + 33.0 + ] + ], + [ + [ + 33.25 + ] + ], + [ + [ + 35.5 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 29.5 + ] + ], + [ + [ + 26.875 + ] + ], + [ + [ + 38.25 + ] + ], + [ + [ + 27.75 + ] + ], + [ + [ + 40.25 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 30.375 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 25.875 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 22.25 + ] + ], + [ + [ + 41.5 + ] + ], + [ + [ + 41.5 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 49.25 + ] + ], + [ + [ + 32.25 + ] + ], + [ + [ + 46.5 + ] + ], + [ + [ + 25.5 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 56.0 + ] + ] + ] + }, + "model.layers.9.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 32.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.9.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.10.attn.qkv": { + "inputs": [ + [ + [ + 109.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.78125 + ] + ] + } + }, + "model.layers.10.attn.o_proj": { + "inputs": [ + [ + [ + 17.625 + ] + ] + ], + "outputs": [ + [ + [ + 476.0 + ] + ], + [ + [ + 1.136489936396103e+38 + ] + ] + ], + "params": { + "weight": [ + [ + 24.0 + ] + ] + } + }, + "model.layers.10.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.40625 + ] + ], + [ + [ + 79.0 + ] + ] + ] + }, + "model.layers.10.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 19.0 + ] + ] + ] + }, + "model.layers.10.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.40625 + ] + ] + ] + }, + "model.layers.10.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 17.625 + ] + ] + ] + }, + "model.layers.10.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 79.0 + ] + ] + ] + }, + "model.layers.10.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 19.0 + ] + ] + ] + }, + "model.layers.10.mlp.router": { + "inputs": [ + [ + [ + 47.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1865234375 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 47.0 + ] + ] + ], + "outputs": [ + [ + [ + 1136.0 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 25.5 + ] + ], + [ + [ + 25.875 + ] + ], + [ + [ + 31.375 + ] + ], + [ + [ + 21.25 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 24.25 + ] + ], + [ + [ + 47.0 + ] + ], + [ + [ + 29.0 + ] + ], + [ + [ + 54.0 + ] + ], + [ + [ + 24.875 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 43.5 + ] + ], + [ + [ + 24.875 + ] + ], + [ + [ + 27.5 + ] + ], + [ + [ + 31.875 + ] + ], + [ + [ + 44.25 + ] + ], + [ + [ + 28.375 + ] + ], + [ + [ + 30.5 + ] + ], + [ + [ + 21.75 + ] + ], + [ + [ + 20.125 + ] + ], + [ + [ + 44.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 42.25 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 55.0 + ] + ], + [ + [ + 44.75 + ] + ], + [ + [ + 29.5 + ] + ] + ] + }, + "model.layers.10.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.10.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.attn.qkv": { + "inputs": [ + [ + [ + 191.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.62890625 + ] + ] + } + }, + "model.layers.11.attn.o_proj": { + "inputs": [ + [ + [ + 21.625 + ] + ] + ], + "outputs": [ + [ + [ + 668.0 + ] + ], + [ + [ + 2.3105721020479983e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 11.4375 + ] + ] + } + }, + "model.layers.11.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.03125 + ] + ], + [ + [ + 80.0 + ] + ] + ] + }, + "model.layers.11.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 21.125 + ] + ] + ] + }, + "model.layers.11.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.03125 + ] + ] + ] + }, + "model.layers.11.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 15.1875 + ] + ] + ] + }, + "model.layers.11.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 80.0 + ] + ] + ] + }, + "model.layers.11.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 22.125 + ] + ] + ] + }, + "model.layers.11.mlp.router": { + "inputs": [ + [ + [ + 79.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.177734375 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 79.0 + ] + ] + ], + "outputs": [ + [ + [ + 688.0 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 35.5 + ] + ], + [ + [ + 26.25 + ] + ], + [ + [ + 29.375 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 23.625 + ] + ], + [ + [ + 27.625 + ] + ], + [ + [ + 32.25 + ] + ], + [ + [ + 25.75 + ] + ], + [ + [ + 30.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 19.25 + ] + ], + [ + [ + 32.0 + ] + ], + [ + [ + 48.75 + ] + ], + [ + [ + 39.0 + ] + ], + [ + [ + 22.75 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 36.5 + ] + ], + [ + [ + 42.5 + ] + ], + [ + [ + 39.0 + ] + ], + [ + [ + 25.375 + ] + ], + [ + [ + 46.75 + ] + ], + [ + [ + 36.75 + ] + ], + [ + [ + 18.75 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 22.125 + ] + ], + [ + [ + 32.75 + ] + ], + [ + [ + 30.0 + ] + ] + ] + }, + "model.layers.11.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.11.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.attn.qkv": { + "inputs": [ + [ + [ + 137.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.322265625 + ] + ] + } + }, + "model.layers.12.attn.o_proj": { + "inputs": [ + [ + [ + 21.0 + ] + ] + ], + "outputs": [ + [ + [ + 520.0 + ] + ], + [ + [ + 5.516296182507401e+37 + ] + ] + ], + "params": { + "weight": [ + [ + 19.25 + ] + ] + } + }, + "model.layers.12.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.265625 + ] + ], + [ + [ + 22.625 + ] + ] + ] + }, + "model.layers.12.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 27.0 + ] + ] + ] + }, + "model.layers.12.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.265625 + ] + ] + ] + }, + "model.layers.12.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 21.0 + ] + ] + ] + }, + "model.layers.12.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 22.625 + ] + ] + ] + }, + "model.layers.12.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 27.0 + ] + ] + ] + }, + "model.layers.12.mlp.router": { + "inputs": [ + [ + [ + 84.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1943359375 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 84.0 + ] + ] + ], + "outputs": [ + [ + [ + 2160.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 21.375 + ] + ], + [ + [ + 38.75 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 30.25 + ] + ], + [ + [ + 38.25 + ] + ], + [ + [ + 40.75 + ] + ], + [ + [ + 45.25 + ] + ], + [ + [ + 14.625 + ] + ], + [ + [ + 30.75 + ] + ], + [ + [ + 19.625 + ] + ], + [ + [ + 22.0 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 29.75 + ] + ], + [ + [ + 36.25 + ] + ], + [ + [ + 41.0 + ] + ], + [ + [ + 33.0 + ] + ], + [ + [ + 49.0 + ] + ], + [ + [ + 27.0 + ] + ], + [ + [ + 41.0 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 33.0 + ] + ], + [ + [ + 34.75 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 19.25 + ] + ], + [ + [ + 37.5 + ] + ], + [ + [ + 34.0 + ] + ], + [ + [ + 18.625 + ] + ], + [ + [ + 30.25 + ] + ], + [ + [ + 26.125 + ] + ], + [ + [ + 38.0 + ] + ] + ] + }, + "model.layers.12.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.12.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.attn.qkv": { + "inputs": [ + [ + [ + 183.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.546875 + ] + ] + } + }, + "model.layers.13.attn.o_proj": { + "inputs": [ + [ + [ + 22.125 + ] + ] + ], + "outputs": [ + [ + [ + 1240.0 + ] + ], + [ + [ + 2.1677839384382905e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 20.375 + ] + ] + } + }, + "model.layers.13.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.015625 + ] + ], + [ + [ + 104.5 + ] + ] + ] + }, + "model.layers.13.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 21.875 + ] + ] + ] + }, + "model.layers.13.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.015625 + ] + ] + ] + }, + "model.layers.13.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 16.75 + ] + ] + ] + }, + "model.layers.13.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 104.5 + ] + ] + ] + }, + "model.layers.13.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 22.625 + ] + ] + ] + }, + "model.layers.13.mlp.router": { + "inputs": [ + [ + [ + 86.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1396484375 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 86.0 + ] + ] + ], + "outputs": [ + [ + [ + 796.0 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 27.375 + ] + ], + [ + [ + 40.25 + ] + ], + [ + [ + 28.625 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 34.0 + ] + ], + [ + [ + 20.25 + ] + ], + [ + [ + 49.5 + ] + ], + [ + [ + 53.25 + ] + ], + [ + [ + 47.25 + ] + ], + [ + [ + 29.25 + ] + ], + [ + [ + 27.5 + ] + ], + [ + [ + 36.0 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 21.0 + ] + ], + [ + [ + 29.125 + ] + ], + [ + [ + 25.625 + ] + ], + [ + [ + 38.75 + ] + ], + [ + [ + 28.875 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 34.25 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 25.125 + ] + ], + [ + [ + 29.5 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 46.75 + ] + ], + [ + [ + 51.5 + ] + ], + [ + [ + 25.625 + ] + ], + [ + [ + 43.0 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 41.0 + ] + ] + ] + }, + "model.layers.13.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.13.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.14.attn.qkv": { + "inputs": [ + [ + [ + 148.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5859375 + ] + ] + } + }, + "model.layers.14.attn.o_proj": { + "inputs": [ + [ + [ + 32.0 + ] + ] + ], + "outputs": [ + [ + [ + 628.0 + ] + ], + [ + [ + 2.1677839384382905e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 9.1875 + ] + ] + } + }, + "model.layers.14.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 8.9375 + ] + ], + [ + [ + 74.5 + ] + ] + ] + }, + "model.layers.14.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 34.5 + ] + ] + ] + }, + "model.layers.14.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 8.9375 + ] + ] + ] + }, + "model.layers.14.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 29.125 + ] + ] + ] + }, + "model.layers.14.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 74.5 + ] + ] + ] + }, + "model.layers.14.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 34.5 + ] + ] + ] + }, + "model.layers.14.mlp.router": { + "inputs": [ + [ + [ + 99.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1630859375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 99.5 + ] + ] + ], + "outputs": [ + [ + [ + 1456.0 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 37.5 + ] + ], + [ + [ + 42.25 + ] + ], + [ + [ + 27.875 + ] + ], + [ + [ + 34.75 + ] + ], + [ + [ + 40.75 + ] + ], + [ + [ + 28.125 + ] + ], + [ + [ + 26.5 + ] + ], + [ + [ + 28.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 28.75 + ] + ], + [ + [ + 42.5 + ] + ], + [ + [ + 16.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 40.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 31.5 + ] + ], + [ + [ + 31.875 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 31.125 + ] + ], + [ + [ + 27.0 + ] + ], + [ + [ + 25.5 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 28.125 + ] + ], + [ + [ + 33.25 + ] + ], + [ + [ + 34.25 + ] + ], + [ + [ + 24.375 + ] + ], + [ + [ + 24.25 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 28.5 + ] + ], + [ + [ + 27.875 + ] + ] + ] + }, + "model.layers.14.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.14.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.attn.qkv": { + "inputs": [ + [ + [ + 164.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.546875 + ] + ] + } + }, + "model.layers.15.attn.o_proj": { + "inputs": [ + [ + [ + 26.375 + ] + ] + ], + "outputs": [ + [ + [ + 2224.0 + ] + ], + [ + [ + 2.3105721020479983e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 18.25 + ] + ] + } + }, + "model.layers.15.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 4.3125 + ] + ], + [ + [ + 76.0 + ] + ] + ] + }, + "model.layers.15.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 48.25 + ] + ] + ] + }, + "model.layers.15.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 4.3125 + ] + ] + ] + }, + "model.layers.15.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 17.5 + ] + ] + ] + }, + "model.layers.15.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 76.0 + ] + ] + ] + }, + "model.layers.15.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 61.5 + ] + ] + ] + }, + "model.layers.15.mlp.router": { + "inputs": [ + [ + [ + 106.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1337890625 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 106.0 + ] + ] + ], + "outputs": [ + [ + [ + 976.0 + ] + ], + [ + [ + 36.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 21.0 + ] + ], + [ + [ + 27.875 + ] + ], + [ + [ + 35.75 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 20.5 + ] + ], + [ + [ + 32.25 + ] + ], + [ + [ + 31.75 + ] + ], + [ + [ + 24.875 + ] + ], + [ + [ + 42.25 + ] + ], + [ + [ + 49.75 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 24.75 + ] + ], + [ + [ + 31.875 + ] + ], + [ + [ + 29.0 + ] + ], + [ + [ + 24.375 + ] + ], + [ + [ + 29.375 + ] + ], + [ + [ + 47.75 + ] + ], + [ + [ + 53.0 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 36.75 + ] + ], + [ + [ + 21.5 + ] + ], + [ + [ + 43.25 + ] + ], + [ + [ + 45.75 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 31.625 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 26.125 + ] + ], + [ + [ + 42.0 + ] + ] + ] + }, + "model.layers.15.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1875 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 64.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.15.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.16.attn.qkv": { + "inputs": [ + [ + [ + 131.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.671875 + ] + ] + } + }, + "model.layers.16.attn.o_proj": { + "inputs": [ + [ + [ + 32.25 + ] + ] + ], + "outputs": [ + [ + [ + 732.0 + ] + ], + [ + [ + 2.2067261648773017e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 12.8125 + ] + ] + } + }, + "model.layers.16.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 5.5625 + ] + ], + [ + [ + 53.75 + ] + ] + ] + }, + "model.layers.16.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 34.5 + ] + ] + ] + }, + "model.layers.16.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 5.5625 + ] + ] + ] + }, + "model.layers.16.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 30.75 + ] + ] + ] + }, + "model.layers.16.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 53.75 + ] + ] + ] + }, + "model.layers.16.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 34.5 + ] + ] + ] + }, + "model.layers.16.mlp.router": { + "inputs": [ + [ + [ + 68.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1298828125 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 68.5 + ] + ] + ], + "outputs": [ + [ + [ + 2800.0 + ] + ], + [ + [ + 29.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 36.0 + ] + ], + [ + [ + 27.875 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 22.0 + ] + ], + [ + [ + 53.25 + ] + ], + [ + [ + 16.875 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 22.375 + ] + ], + [ + [ + 28.5 + ] + ], + [ + [ + 39.25 + ] + ], + [ + [ + 36.0 + ] + ], + [ + [ + 31.0 + ] + ], + [ + [ + 20.125 + ] + ], + [ + [ + 28.75 + ] + ], + [ + [ + 22.125 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 30.0 + ] + ], + [ + [ + 37.5 + ] + ], + [ + [ + 19.625 + ] + ], + [ + [ + 25.0 + ] + ], + [ + [ + 30.5 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 35.0 + ] + ], + [ + [ + 35.75 + ] + ], + [ + [ + 43.25 + ] + ], + [ + [ + 26.625 + ] + ], + [ + [ + 21.25 + ] + ], + [ + [ + 35.5 + ] + ], + [ + [ + 32.0 + ] + ] + ] + }, + "model.layers.16.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.16.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.attn.qkv": { + "inputs": [ + [ + [ + 125.5 + ] + ] + ], + "params": { + "weight": [ + [ + 0.765625 + ] + ] + } + }, + "model.layers.17.attn.o_proj": { + "inputs": [ + [ + [ + 16.75 + ] + ] + ], + "outputs": [ + [ + [ + 1808.0 + ] + ], + [ + [ + 2.3495143284870095e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 18.625 + ] + ] + } + }, + "model.layers.17.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 5.71875 + ] + ], + [ + [ + 115.0 + ] + ] + ] + }, + "model.layers.17.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 24.375 + ] + ] + ] + }, + "model.layers.17.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 5.71875 + ] + ] + ] + }, + "model.layers.17.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 14.125 + ] + ] + ] + }, + "model.layers.17.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 115.0 + ] + ] + ] + }, + "model.layers.17.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 24.375 + ] + ] + ] + }, + "model.layers.17.mlp.router": { + "inputs": [ + [ + [ + 41.75 + ] + ] + ], + "params": { + "weight": [ + [ + 0.099609375 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 41.75 + ] + ] + ], + "outputs": [ + [ + [ + 41728.0 + ] + ], + [ + [ + 24.25 + ] + ], + [ + [ + 27.75 + ] + ], + [ + [ + 43.75 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 31.375 + ] + ], + [ + [ + 45.25 + ] + ], + [ + [ + 27.625 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 40.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 43.25 + ] + ], + [ + [ + 39.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 31.625 + ] + ], + [ + [ + 41.5 + ] + ], + [ + [ + 30.375 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 45.0 + ] + ], + [ + [ + 46.75 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 33.25 + ] + ], + [ + [ + 47.25 + ] + ], + [ + [ + 34.0 + ] + ], + [ + [ + 28.5 + ] + ], + [ + [ + 47.0 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 54.25 + ] + ] + ] + }, + "model.layers.17.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 96.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 128.0 + ] + ] + } + }, + "model.layers.17.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.attn.qkv": { + "inputs": [ + [ + [ + 53.75 + ] + ] + ], + "params": { + "weight": [ + [ + 2.671875 + ] + ] + } + }, + "model.layers.18.attn.o_proj": { + "inputs": [ + [ + [ + 30.75 + ] + ] + ], + "outputs": [ + [ + [ + 1528.0 + ] + ], + [ + [ + 2.3495143284870095e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 16.5 + ] + ] + } + }, + "model.layers.18.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 5.75 + ] + ], + [ + [ + 75.0 + ] + ] + ] + }, + "model.layers.18.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 36.0 + ] + ] + ] + }, + "model.layers.18.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 5.75 + ] + ] + ] + }, + "model.layers.18.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 28.875 + ] + ] + ] + }, + "model.layers.18.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 75.0 + ] + ] + ] + }, + "model.layers.18.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 36.0 + ] + ] + ] + }, + "model.layers.18.mlp.router": { + "inputs": [ + [ + [ + 19.125 + ] + ] + ], + "params": { + "weight": [ + [ + 0.11865234375 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 19.125 + ] + ] + ], + "outputs": [ + [ + [ + 2944.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 34.75 + ] + ], + [ + [ + 30.375 + ] + ], + [ + [ + 47.25 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 39.0 + ] + ], + [ + [ + 51.25 + ] + ], + [ + [ + 52.75 + ] + ], + [ + [ + 27.75 + ] + ], + [ + [ + 24.5 + ] + ], + [ + [ + 46.25 + ] + ], + [ + [ + 34.0 + ] + ], + [ + [ + 30.875 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 22.125 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 41.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.5 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 54.0 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 29.75 + ] + ], + [ + [ + 23.375 + ] + ], + [ + [ + 35.5 + ] + ], + [ + [ + 53.75 + ] + ], + [ + [ + 52.25 + ] + ] + ] + }, + "model.layers.18.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 12.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2048.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 192.0 + ] + ] + } + }, + "model.layers.18.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.attn.qkv": { + "inputs": [ + [ + [ + 89.5 + ] + ] + ], + "params": { + "weight": [ + [ + 3.828125 + ] + ] + } + }, + "model.layers.19.attn.o_proj": { + "inputs": [ + [ + [ + 24.75 + ] + ] + ], + "outputs": [ + [ + [ + 2048.0 + ] + ], + [ + [ + 5.516296182507401e+37 + ] + ] + ], + "params": { + "weight": [ + [ + 56.75 + ] + ] + } + }, + "model.layers.19.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 3.8125 + ] + ], + [ + [ + 206.0 + ] + ] + ] + }, + "model.layers.19.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 29.5 + ] + ] + ] + }, + "model.layers.19.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 3.8125 + ] + ] + ] + }, + "model.layers.19.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 18.875 + ] + ] + ] + }, + "model.layers.19.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 206.0 + ] + ] + ] + }, + "model.layers.19.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 29.5 + ] + ] + ] + }, + "model.layers.19.mlp.router": { + "inputs": [ + [ + [ + 26.125 + ] + ] + ], + "params": { + "weight": [ + [ + 0.1474609375 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 26.125 + ] + ] + ], + "outputs": [ + [ + [ + 3376.0 + ] + ], + [ + [ + 46.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 36.5 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 55.75 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 47.75 + ] + ], + [ + [ + 22.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 46.25 + ] + ], + [ + [ + 46.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 49.25 + ] + ], + [ + [ + 31.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 54.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 33.0 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 32.5 + ] + ] + ] + }, + "model.layers.19.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1536.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.19.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.attn.qkv": { + "inputs": [ + [ + [ + 52.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.59375 + ] + ] + } + }, + "model.layers.20.attn.o_proj": { + "inputs": [ + [ + [ + 30.25 + ] + ] + ], + "outputs": [ + [ + [ + 1800.0 + ] + ], + [ + [ + 5.516296182507401e+37 + ] + ] + ], + "params": { + "weight": [ + [ + 38.0 + ] + ] + } + }, + "model.layers.20.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 4.84375 + ] + ], + [ + [ + 54.0 + ] + ] + ] + }, + "model.layers.20.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 35.25 + ] + ] + ] + }, + "model.layers.20.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 4.84375 + ] + ] + ] + }, + "model.layers.20.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 27.125 + ] + ] + ] + }, + "model.layers.20.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 54.0 + ] + ] + ] + }, + "model.layers.20.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 35.25 + ] + ] + ] + }, + "model.layers.20.mlp.router": { + "inputs": [ + [ + [ + 26.125 + ] + ] + ], + "params": { + "weight": [ + [ + 0.12890625 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 26.125 + ] + ] + ], + "outputs": [ + [ + [ + 6976.0 + ] + ], + [ + [ + 43.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 45.75 + ] + ], + [ + [ + 45.25 + ] + ], + [ + [ + 47.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 35.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 37.5 + ] + ], + [ + [ + 51.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 30.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 41.25 + ] + ], + [ + [ + 42.25 + ] + ], + [ + [ + 49.25 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 48.0 + ] + ], + [ + [ + 36.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 30.875 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 46.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 56.0 + ] + ] + ] + }, + "model.layers.20.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 6.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 8.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1536.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 256.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.20.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.21.attn.qkv": { + "inputs": [ + [ + [ + 82.5 + ] + ] + ], + "params": { + "weight": [ + [ + 8.5 + ] + ] + } + }, + "model.layers.21.attn.o_proj": { + "inputs": [ + [ + [ + 31.0 + ] + ] + ], + "outputs": [ + [ + [ + 5088.0 + ] + ], + [ + [ + 2.3105721020479983e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 194.0 + ] + ] + } + }, + "model.layers.21.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 8.3125 + ] + ], + [ + [ + 205.0 + ] + ] + ] + }, + "model.layers.21.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 39.0 + ] + ] + ] + }, + "model.layers.21.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 8.3125 + ] + ] + ] + }, + "model.layers.21.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 30.125 + ] + ] + ] + }, + "model.layers.21.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 205.0 + ] + ] + ] + }, + "model.layers.21.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 39.0 + ] + ] + ] + }, + "model.layers.21.mlp.router": { + "inputs": [ + [ + [ + 35.75 + ] + ] + ], + "params": { + "weight": [ + [ + 0.12109375 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 35.75 + ] + ] + ], + "outputs": [ + [ + [ + 7264.0 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 47.0 + ] + ], + [ + [ + 42.5 + ] + ], + [ + [ + 39.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 41.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 22.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 54.5 + ] + ], + [ + [ + 52.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.5 + ] + ], + [ + [ + 34.5 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 51.5 + ] + ], + [ + [ + 47.0 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 28.375 + ] + ], + [ + [ + 52.5 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 51.25 + ] + ], + [ + [ + 46.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 50.5 + ] + ] + ] + }, + "model.layers.21.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1536.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2048.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2048.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1536.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1536.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.21.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.attn.qkv": { + "inputs": [ + [ + [ + 54.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.9375 + ] + ] + } + }, + "model.layers.22.attn.o_proj": { + "inputs": [ + [ + [ + 38.25 + ] + ] + ], + "outputs": [ + [ + [ + 3600.0 + ] + ], + [ + [ + 2.3495143284870095e+35 + ] + ] + ], + "params": { + "weight": [ + [ + 53.75 + ] + ] + } + }, + "model.layers.22.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 7.375 + ] + ], + [ + [ + 48.25 + ] + ] + ] + }, + "model.layers.22.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 53.5 + ] + ] + ] + }, + "model.layers.22.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 7.375 + ] + ] + ] + }, + "model.layers.22.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 30.125 + ] + ] + ] + }, + "model.layers.22.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 48.25 + ] + ] + ] + }, + "model.layers.22.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 53.5 + ] + ] + ] + }, + "model.layers.22.mlp.router": { + "inputs": [ + [ + [ + 30.25 + ] + ] + ], + "params": { + "weight": [ + [ + 0.16796875 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 30.25 + ] + ] + ], + "outputs": [ + [ + [ + 9088.0 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 48.75 + ] + ], + [ + [ + 47.0 + ] + ], + [ + [ + 48.5 + ] + ], + [ + [ + 44.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 43.0 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 44.5 + ] + ], + [ + [ + 31.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 49.5 + ] + ], + [ + [ + 55.25 + ] + ], + [ + [ + 31.875 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 38.5 + ] + ], + [ + [ + 42.0 + ] + ], + [ + [ + 51.5 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 36.0 + ] + ], + [ + [ + 35.75 + ] + ], + [ + [ + 48.75 + ] + ], + [ + [ + 41.5 + ] + ], + [ + [ + 50.0 + ] + ], + [ + [ + 31.75 + ] + ], + [ + [ + 33.75 + ] + ], + [ + [ + 32.25 + ] + ] + ] + }, + "model.layers.22.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.5 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.25 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.375 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3072.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1536.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.22.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.23.attn.qkv": { + "inputs": [ + [ + [ + 77.0 + ] + ] + ], + "params": { + "weight": [ + [ + 5.75 + ] + ] + } + }, + "model.layers.23.attn.o_proj": { + "inputs": [ + [ + [ + 57.75 + ] + ] + ], + "outputs": [ + [ + [ + 12032.0 + ] + ], + [ + [ + 1.0799977465752441e+37 + ] + ] + ], + "params": { + "weight": [ + [ + 197.0 + ] + ] + } + }, + "model.layers.23.attn.attn.impl.matmul_qk": { + "inputs": [ + [ + [ + 5.28125 + ] + ], + [ + [ + 137.0 + ] + ] + ] + }, + "model.layers.23.attn.attn.impl.matmul_av": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 60.5 + ] + ] + ] + }, + "model.layers.23.attn.attn.impl.batch2block_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 5.28125 + ] + ] + ] + }, + "model.layers.23.attn.attn.impl.block2batch_matmul": { + "inputs": [ + [ + [ + 1.0 + ] + ], + [ + [ + 47.75 + ] + ] + ] + }, + "model.layers.23.attn.attn.impl.k_cache": { + "inputs": [ + [ + [ + 137.0 + ] + ] + ] + }, + "model.layers.23.attn.attn.impl.v_cache": { + "inputs": [ + [ + [ + 60.5 + ] + ] + ] + }, + "model.layers.23.mlp.router": { + "inputs": [ + [ + [ + 60.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.16796875 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op": { + "inputs": [ + [ + [ + 60.0 + ] + ] + ], + "outputs": [ + [ + [ + 97792.0 + ] + ], + [ + [ + 37.5 + ] + ], + [ + [ + 49.5 + ] + ], + [ + [ + 54.25 + ] + ], + [ + [ + 24.75 + ] + ], + [ + [ + 50.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 39.75 + ] + ], + [ + [ + 32.5 + ] + ], + [ + [ + 53.5 + ] + ], + [ + [ + 40.0 + ] + ], + [ + [ + 38.75 + ] + ], + [ + [ + 45.5 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 51.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 52.25 + ] + ], + [ + [ + 52.25 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 28.25 + ] + ], + [ + [ + 52.75 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 36.25 + ] + ], + [ + [ + 37.75 + ] + ], + [ + [ + 53.25 + ] + ], + [ + [ + 37.0 + ] + ], + [ + [ + 33.5 + ] + ], + [ + [ + 49.75 + ] + ], + [ + [ + 38.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 56.0 + ] + ], + [ + [ + 43.0 + ] + ], + [ + [ + 54.25 + ] + ] + ] + }, + "model.layers.23.mlp.experts.moe_op.w13_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 0.75 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 3.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 4.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w13_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1.5 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.0": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.1": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.2": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.3": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.4": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.5": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.6": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.7": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.8": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2048.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.9": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.10": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.11": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.12": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 2048.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.13": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.14": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.15": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 384.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.16": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.17": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.18": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.19": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.20": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.21": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.22": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 768.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.23": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.24": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.25": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.26": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 1024.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.27": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.28": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.29": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.30": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + }, + "model.layers.23.mlp.experts.moe_op.w2_list.31": { + "inputs": [ + [ + [ + 0.0 + ] + ] + ], + "params": { + "weight": [ + [ + 512.0 + ] + ] + } + } + } +} \ No newline at end of file diff --git a/scripts/gpt_oss_20b_post/inc_output_hooks_maxabs_0_1.npz b/scripts/gpt_oss_20b_post/inc_output_hooks_maxabs_0_1.npz new file mode 100755 index 000000000000..7c25831ba2b0 Binary files /dev/null and b/scripts/gpt_oss_20b_post/inc_output_hooks_maxabs_0_1.npz differ diff --git a/scripts/quant_configs/inc_quant_fp8.json b/scripts/quant_configs/inc_quant_fp8.json new file mode 100644 index 000000000000..e088b08a5bf7 --- /dev/null +++ b/scripts/quant_configs/inc_quant_fp8.json @@ -0,0 +1,20 @@ +{ + "mode": "QUANTIZE", + "observer": "maxabs", + "scale_method": "maxabs_hw", + "scale_format": "scalar", + "allowlist": { + "types": [], + "names": [] + }, + "blocklist": { + "types": [ + ], + "names": [ + "fused_scaled_dot_product_attention", + "lm_head", + "mlp\\.gate\\b" + ] + }, + "dump_stats_path": "./gpt_oss_20b_post/inc_output" +} \ No newline at end of file diff --git a/scripts/run_basic_fp8.sh b/scripts/run_basic_fp8.sh new file mode 100644 index 000000000000..7d3bb4222b49 --- /dev/null +++ b/scripts/run_basic_fp8.sh @@ -0,0 +1,68 @@ +#!/bin/bash +QUANT_CONFIG_FILE="./quant_configs/inc_unit_scale.json" +timestamp=$(date +%Y%m%d_%H%M%S) +LOG_FILE="calib.pile.512.${timestamp}.log" + + +echo "Start INC calibration with model ${FP8_MODEL_PATH}, log file ${LOG_FILE}" + +model_path="/software/users/yiliu7/HF_HOME/lmsys/gpt-oss-20b-bf16" + +# model_path="/software/users/yiliu7/HF_HOME/lmsys/gpt-oss-120b-bf16" + +tp_size=1 +ep_size=1 +basename=$(basename $model_path) +is_120b=false +if [[ $basename == *"120b"* ]]; then + is_120b=true +fi + +export VLLM_BUILD=1.23.0.248 +export VLLM_BUILD=1.23.0.473 +export QUANT_CONFIG=./quant_configs/inc_unit_scale.json +export QUANT_CONFIG=./quant_configs/inc_quant_fp8.json +# export QUANT_CONFIG=./quant_configs/inc_quant.json +# export QUANT_CONFIG=./quant_configs/inc_measure.json + + +export INC_PT_ONLY=1 +nprompts=512 +nprompts=4 +# is 120b +if [ "$is_120b" = true ]; then + echo "Using model 120B, setting tp_size=4" + tp_size=4 + ep_size=1 + # export QUANT_CONFIG=./quant_configs/inc_quant_120b.json + # export QUANT_CONFIG=./quant_configs/inc_measure_120b.json + +else + echo "Using model 20B, setting tp_size=1" + tp_size=1 + ep_size=1 +fi + +# VLLM_PROMPT_USE_FUSEDSDPA=0 \ +# PT_HPU_GPT_MOE_WT_INTERLEAVED=1 \ +# VLLM_ENABLE_FUSED_MOE_WITH_BIAS=1 \ +PT_HPU_QKV_SLICE_SEQ_LEN_THLD=128 \ +PT_HPU_ENABLE_FUSED_SDPA_SINK=1 \ +PT_HPU_SDPA_QKV_SLICE_MODE_FWD=1 \ +PT_HPU_LAZY_MODE=1 \ +VLLM_DISABLE_MARK_SCALES_AS_CONST=1 \ +VLLM_LOGGING_LEVEL=DEBUG \ +PT_HPU_LAZY_MODE=1 \ +VLLM_SKIP_WARMUP=true python run_example_tp.py \ + --tp_size $tp_size \ + --ep_size $ep_size \ + --model $model_path \ + --osl 32 \ + --max_num_seqs 1 \ + --max_model_len 2048 \ + --tokenizer $model_path \ + --fp8_kv_cache \ + --nprompts $nprompts 2>&1 | tee $LOG_FILE + + +