Skip to content

Commit bc708b4

Browse files
committed
fix merge conflict
1 parent 1804fa2 commit bc708b4

File tree

3 files changed

+6
-1
lines changed

3 files changed

+6
-1
lines changed

tools/mtmd/clip-impl.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -102,6 +102,7 @@
102102
#define TN_MM_AUDIO_MLP "mm.a.mlp.%d.%s"
103103
#define TN_MM_NORM_PRE "mm.a.norm_pre.%s"
104104
#define TN_MM_NORM_MID "mm.a.norm_mid.%s"
105+
105106
// align x to upper multiple of n
106107
#define CLIP_ALIGN(x, n) ((((x) + (n) - 1) / (n)) * (n))
107108

tools/mtmd/clip.cpp

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1736,7 +1736,7 @@ static ggml_cgraph * clip_image_build_graph(clip_ctx * ctx, const clip_image_f32
17361736
} break;
17371737
case PROJECTOR_TYPE_ULTRAVOX:
17381738
{
1739-
GGML_ASSERT(imgs.entries.size() == 1);
1739+
res = nullptr;
17401740
} break;
17411741
default:
17421742
{
@@ -2205,6 +2205,7 @@ struct clip_model_loader {
22052205
vision_model.mm_2_w = get_tensor(string_format(TN_MM_AUDIO_MLP, 2, "weight"));
22062206
vision_model.mm_norm_pre_w = get_tensor(string_format(TN_MM_NORM_PRE, "weight"));
22072207
vision_model.mm_norm_mid_w = get_tensor(string_format(TN_MM_NORM_MID, "weight"));
2208+
} break;
22082209
case PROJECTOR_TYPE_INTERNVL:
22092210
{
22102211
vision_model.mm_0_w = get_tensor(string_format(TN_MVLM_PROJ_MLP, 0, "weight"));

tools/mtmd/clip.h

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -97,3 +97,6 @@ bool clip_is_llava(const struct clip_ctx * ctx);
9797
bool clip_is_gemma3(const struct clip_ctx * ctx);
9898

9999
bool clip_encode_float_image (struct clip_ctx * ctx, int n_threads, float * img, int h, int w, float * vec);
100+
101+
// used by audio input
102+
void clip_image_f32_batch_add_mel(struct clip_image_f32_batch * batch, int n_mel, int n_step, float * mel);

0 commit comments

Comments
 (0)