Skip to content

Commit bb5e624

Browse files
committed
Misc. fixes.
1 parent 14921d3 commit bb5e624

File tree

2 files changed

+2
-1
lines changed

2 files changed

+2
-1
lines changed

src/llama-arch.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2546,6 +2546,7 @@ static const std::map<llm_tensor, llm_tensor_info> LLM_TENSOR_INFOS = {
2546 2546       {LLM_TENSOR_SSM_X, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
2547 2547       {LLM_TENSOR_SSM_DT, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
2548 2548       {LLM_TENSOR_SSM_OUT, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
     2549 +     {LLM_TENSOR_SSM_BETA_ALPHA, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
2549 2550       {LLM_TENSOR_TIME_MIX_W1, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
2550 2551       {LLM_TENSOR_TIME_MIX_W2, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
2551 2552       {LLM_TENSOR_TIME_MIX_A1, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},

src/llama-context.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1388,7 +1388,7 @@ void llama_context::output_reorder() {
1388 1388
1389 1389   uint32_t llama_context::graph_max_nodes() const {
1390 1390       if (model.arch == LLM_ARCH_QWEN3NEXT) {
1391      -         return std::max<uint32_t>(8192, 32u*model.n_tensors());
     1391 +         return std::max<uint32_t>(8192u, 32u*model.n_tensors());
1392 1392       }
1393 1393       return std::max<uint32_t>(1024u, 8u*model.n_tensors());
1394 1394   }

0 commit comments

Comments
 (0)