mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2026-05-22 11:16:08 +00:00
server: re-inject subcommand when router spawns children under unified binary (#23442)
This commit is contained in:
parent
1d7ab2b947
commit
c9021714e8
2 changed files with 17 additions and 0 deletions
|
|
@ -1,6 +1,7 @@
|
|||
#include "build-info.h"
|
||||
|
||||
#include <cstdio>
|
||||
#include <cstdlib>
|
||||
#include <string>
|
||||
#include <vector>
|
||||
|
||||
|
|
@ -77,6 +78,14 @@ int main(int argc, char ** argv) {
|
|||
|
||||
for (const auto & cmd : cmds) {
|
||||
if (matches(arg, cmd)) {
|
||||
|
||||
// router spawns children through this same binary, it needs the
|
||||
// subcommand to relaunch as 'llama serve' and not bare options
|
||||
#ifdef _WIN32
|
||||
_putenv_s("LLAMA_APP_CMD", cmd.name);
|
||||
#else
|
||||
setenv("LLAMA_APP_CMD", cmd.name, 1);
|
||||
#endif
|
||||
return cmd.func(argc - 1, argv + 1);
|
||||
}
|
||||
}
|
||||
|
|
|
|||
|
|
@ -14,6 +14,7 @@
|
|||
#include <mutex>
|
||||
#include <condition_variable>
|
||||
#include <cstring>
|
||||
#include <cstdlib>
|
||||
#include <atomic>
|
||||
#include <chrono>
|
||||
#include <queue>
|
||||
|
|
@ -159,6 +160,13 @@ void server_model_meta::update_args(common_preset_context & ctx_preset, std::str
|
|||
// TODO: maybe validate preset before rendering ?
|
||||
// render args
|
||||
args = preset.to_args(bin_path);
|
||||
|
||||
// unified binary dispatches by subcommand, re-inject it right after the
|
||||
// binary path so the child starts as 'llama serve ...' not 'llama ...'
|
||||
const char * app_cmd = std::getenv("LLAMA_APP_CMD");
|
||||
if (app_cmd != nullptr && app_cmd[0] != '\0' && !bin_path.empty()) {
|
||||
args.insert(args.begin() + 1, app_cmd);
|
||||
}
|
||||
}
|
||||
|
||||
void server_model_meta::update_caps() {
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue