readme : model : mtmd : lfm2 improvements (#15476)

* Support untied embeddings
* Increase number of image tokens to 1024
* Add LFM2-VL to readme
* Actually use untied embeddings
2025-09-11 01:24:36 +00:00 · 2025-08-22 09:29:08 +02:00 · 2025-08-22 09:29:08 +02:00 · e288693669
commit e288693669
parent a0f98dd604
5 changed files with 11 additions and 4 deletions
--- a/tools/mtmd/clip.cpp
+++ b/tools/mtmd/clip.cpp
@@ -3513,7 +3513,7 @@ bool clip_image_preprocess(struct clip_ctx * ctx, const clip_image_u8 * img, str
        const int height = img->ny;
        const int total_factor = params.patch_size * params.proj_scale_factor;
        constexpr int min_image_tokens = 64;
-        constexpr int max_image_tokens = 256;
+        constexpr int max_image_tokens = 1024;
        const float min_pixels = min_image_tokens * total_factor * total_factor;
        const float max_pixels = max_image_tokens * total_factor * total_factor;