Skip to content

Commit 89a3742

Browse files
committed
skip unquantizable clip layers
1 parent b8883e2 commit 89a3742

File tree

1 file changed

+11
-0
lines changed

1 file changed

+11
-0
lines changed

tools/mtmd/clip.cpp

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4149,6 +4149,17 @@ bool clip_model_quantize(const char * fname_inp, const char * fname_out, const i
41494149
{
41504150
quantize = false;
41514151
}
4152+
for(int d=0;d<ggml_n_dims(cur);++d)
4153+
{
4154+
const int64_t blck_size = ggml_blck_size(type);
4155+
if(d==0 && cur->ne[d] % blck_size != 0)
4156+
{
4157+
printf("\nSkipping %s because %d is not divisible by %d\n",name.c_str(),cur->ne[d],blck_size);
4158+
quantize = false;
4159+
break;
4160+
}
4161+
}
4162+
41524163
// //temp fix for gemma3
41534164
// if(name.find("ffn_up.weight") != std::string::npos)
41544165
// {

0 commit comments

Comments
 (0)