open-notebook/open_notebook/graphs/utils.py

from langchain.output_parsers import OutputFixingParser
from langchain_core.messages import AIMessage
from loguru import logger

from open_notebook.domain.models import model_manager
from open_notebook.prompter import Prompter
from open_notebook.utils import token_count


def provision_model(content, config, default_type):
    """
    Return the best model to use based on the context size and on whether a
    specific model is requested in the config:
    - if the content exceeds 105_000 tokens, return the default large-context model
    - else, if a model_id is specified in the config, return that model
    - otherwise, return the default model for the given type
    """
    tokens = token_count(content)
    if tokens > 105_000:
        logger.debug(
            f"Using large context model because the content has {tokens} tokens"
        )
        return model_manager.get_default_model("large_context").to_langchain()
    elif config.get("configurable", {}).get("model_id"):
        return model_manager.get_model(
            config.get("configurable", {}).get("model_id")
        ).to_langchain()
    else:
        return model_manager.get_default_model(default_type).to_langchain()
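

# Usage sketch (illustrative only, not part of the original module): provision_model
# expects a LangGraph-style RunnableConfig dict. The model_id value and the
# document_text variable below are hypothetical placeholders.
#
#   config = {"configurable": {"model_id": "my-registered-model-id"}}
#   chat_model = provision_model(document_text, config, "transformation")
#
#   # With an empty config and a small document, the default "transformation"
#   # model is returned instead:
#   chat_model = provision_model(document_text, {}, "transformation")

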
# todo: turn into a graph
def run_pattern(
    pattern_name: str,
    config,
    messages=[],
    state: dict = {},
    parser=None,
    output_fixing_model_id=None,
) -> AIMessage:
    """
    Render the prompt template for `pattern_name`, pick a model via
    provision_model, and invoke it with the rendered system prompt plus any
    extra messages. If a parser is given, its output is parsed; if
    output_fixing_model_id is also given, an OutputFixingParser is appended to
    retry malformed outputs with that model.
    """
    system_prompt = Prompter(prompt_template=pattern_name, parser=parser).render(
        data=state
    )
    payload = [system_prompt] + messages
    chain = provision_model(str(payload), config, "transformation")
    if parser:
        chain = chain | parser
    if output_fixing_model_id and parser:
        # Convert the domain model to a LangChain runnable, consistent with
        # provision_model, so OutputFixingParser can invoke it.
        output_fix_model = model_manager.get_model(
            output_fixing_model_id
        ).to_langchain()
        chain = chain | OutputFixingParser.from_llm(
            parser=parser,
            llm=output_fix_model,
        )
    response = chain.invoke(payload)
    return response
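

# Usage sketch (illustrative only): how run_pattern might be wired up with a
# structured-output parser. The "summarize" template name, the Summary schema,
# the state keys, and source_text are hypothetical examples, not part of this
# module or its prompt library.
#
#   from langchain_core.messages import HumanMessage
#   from langchain_core.output_parsers import PydanticOutputParser
#   from pydantic import BaseModel
#
#   class Summary(BaseModel):
#       title: str
#       summary: str
#
#   result = run_pattern(
#       pattern_name="summarize",
#       config={"configurable": {}},
#       messages=[HumanMessage(content=source_text)],
#       state={"instructions": "Keep it under 200 words"},
#       parser=PydanticOutputParser(pydantic_object=Summary),
#   )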