Skip to content

Commit f54d377

Browse files
authored
Merge branch 'ikawrakow:main' into main
2 parents 38b1232 + 40097e7 commit f54d377

File tree

1 file changed

+4 -1 lines changed

1 file changed

+4
-1
lines changed

src/llama-build-context.cpp

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1133,7 +1133,10 @@ llm_expert_gating_func_type gating_op,
1133 1133   results[id] = shared_out;
1134 1134   }
1135 1135   cur = ggml_add(ctx, results[0], results[1]);
1136      - cur->op_params[0] = 0xff;
     1136 + if (cur->ne[1] > 32) {
     1137 + // Force a graph split
     1138 + cur->op_params[0] = 0xff;
     1139 + }
1137 1140   cb(cur, "ffn_shared_combined", il);
1138 1141   for (int id = 2; id < int(results.size()); ++id) {
1139 1142   cur = ggml_add(ctx, cur, results[id]);

0 commit comments

Comments
 (0)