Use the generation config from the JSON file in the official repo

2025-09-10 06:14:58 +00:00 · 2025-02-27 11:48:34 +00:00 · 2025-02-27 11:48:34 +00:00 · e645d84794
commit e645d84794
parent 9660b2cc1e
4 changed files with 57 additions and 21 deletions
--- a/ktransformers/util/utils.py
+++ b/ktransformers/util/utils.py
@@ -184,8 +184,9 @@ def prefill_and_generate(model, tokenizer, inputs, max_new_tokens=10000, use_cud
            inputs_embeds = inputs_embeds, cache_position=cache_position, past_key_values=past_key_values, return_dict=False, use_cache=True
        )[0][:,-1,:].unsqueeze(0).clone().to(torch_device)
        generation_config, model_kwargs = model._prepare_generation_config(
-            None, max_length=max_new_tokens,
-            do_sample=True, top_k=5, top_p=0.85, temperature=0.1 # change this to modify generate config
+            None, do_sample=True
+            # change this to modify generate config
+            #top_k=5, top_p=0.85, temperature=0.1
        )
        try: # transformers==4.43
            logits_warper = (