Skip to content

Commit 1ef4b5e

Browse files
authored
Disable split mode graph for recurrent/hybrid models when tensor overrides are used (#1366)
1 parent 8fb0022 commit 1ef4b5e

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

src/llama.cpp

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1981,6 +1981,14 @@ static bool llm_load_tensors(
19811981
LLAMA_LOG_WARN("================================================================\n\n");
19821982
max_gpu = 4;
19831983
}
1984+
else if (llama_model_has_recurrent(&model) && model.has_tensor_overrides()) {
1985+
LLAMA_LOG_WARN("\n================================================================\n");
1986+
LLAMA_LOG_WARN("Split mode 'graph' for recurrent/hybrid models is currently\n");
1987+
LLAMA_LOG_WARN("disabled when using tensor overrides\n");
1988+
LLAMA_LOG_WARN(" => changing split mode to 'layer'\n");
1989+
LLAMA_LOG_WARN("=======================================================\n\n");
1990+
split_mode = LLAMA_SPLIT_MODE_LAYER;
1991+
}
19841992
}
19851993
}
19861994

0 commit comments

Comments
 (0)