diff --git a/Makefile b/Makefile index dd93602e0..9f912d812 100644 --- a/Makefile +++ b/Makefile @@ -714,7 +714,7 @@ ttsmain: tools/tts/tts.cpp common/arg.cpp build-info.h ggml.o ggml-cpu.o ggml-op $(CXX) $(CXXFLAGS) $(filter-out %.h,$^) -o $@ $(LDFLAGS) gguf-split: tools/gguf-split/gguf-split.cpp ggml.o ggml-cpu.o ggml-ops.o ggml-vec.o ggml-binops.o ggml-unops.o llama.o build-info.h llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS) $(CXX) $(CXXFLAGS) $(filter-out %.h,$^) -o $@ $(LDFLAGS) -mtmd-cli: tools/mtmd/mtmd-cli.cpp tools/mtmd/mtmd.cpp common/arg.cpp build-info.h ggml.o ggml-cpu.o ggml-ops.o ggml-vec.o ggml-binops.o ggml-unops.o llama.o console.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS) +mtmd-cli: tools/mtmd/mtmd-cli.cpp tools/mtmd/mtmd.cpp tools/mtmd/mtmd-helper.cpp tools/mtmd/clip.cpp common/arg.cpp build-info.h ggml.o ggml-cpu.o ggml-ops.o ggml-vec.o ggml-binops.o ggml-unops.o llama.o console.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS) $(CXX) $(CXXFLAGS) $(filter-out %.h,$^) -o $@ $(LDFLAGS) mainvk: tools/main/main.cpp common/arg.cpp build-info.h ggml_v4_vulkan.o ggml-cpu.o ggml-ops.o ggml-vec.o ggml-binops.o ggml-unops.o llama.o console.o llavaclip_vulkan.o llava.o ggml-backend_vulkan.o ggml-backend-reg_vulkan.o ggml-vulkan.o $(OBJS_FULL) $(OBJS) lib/vulkan-1.lib $(CXX) $(CXXFLAGS) -DGGML_USE_VULKAN -DSD_USE_VULKAN $(filter-out %.h,$^) -o $@ $(LDFLAGS) diff --git a/gpttype_adapter.cpp b/gpttype_adapter.cpp index d66edd4d1..7bf9fb358 100644 --- a/gpttype_adapter.cpp +++ b/gpttype_adapter.cpp @@ -3089,7 +3089,7 @@ static void PrepareMediaEmbds(const int nctx, const std::vector & media_sep } else { if(debugmode==1 && !is_quiet) { - printf("\nAudio Clip Embed Chunk %i used Tokens: %d",i,chunk.clp_image_tokens); + printf("\nAudio Clip %i Embed Chunk used Tokens: %d",i,chunk.clp_image_tokens); } total_chunk_tokens += chunk.clp_image_tokens; media_objects[i].mediachunks.push_back(chunk); @@ -3480,7 +3480,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs) TokenizeString(kcpp_data->prompt, embd_inp, file_format, add_bos_token); bool use_mrope = (file_format == FileFormat::GGUF_GENERIC && file_format_meta.model_architecture == GGUFArch::ARCH_QWEN2VL); TokenizeString("\n\n", media_sep, file_format, false); - TokenizeString("\nImages:\n", media_intro, file_format, false); + TokenizeString("\nAttached Media:\n", media_intro, file_format, false); if(media_composite_image_signature=="") { diff --git a/klite.embd b/klite.embd index 36c8239ed..822194c02 100644 --- a/klite.embd +++ b/klite.embd @@ -12,7 +12,7 @@ Current version indicated by LITEVER below. -->