# HF libraries from langchain_huggingface import HuggingFaceEndpoint from langchain.agents import AgentExecutor from langchain.agents.format_scratchpad import format_log_to_str from langchain.agents.output_parsers import ReActJsonSingleInputOutputParser # Import things that are needed generically from langchain.tools.render import render_text_description import os from dotenv import load_dotenv # local cache from langchain.globals import set_llm_cache from langchain_community.cache import SQLiteCache # sqlite #from langchain.cache import InMemoryCache # in memory cache from rag_app.structured_tools.structured_tools import ( google_search, knowledgeBase_search ) from langchain.prompts import PromptTemplate from rag_app.templates.react_json_with_memory_ger import template_system # from innovation_pathfinder_ai.utils import logger # logger = logger.get_console_logger("hf_mixtral_agent") config = load_dotenv(".env") HUGGINGFACEHUB_API_TOKEN = os.getenv('HUGGINGFACEHUB_API_TOKEN') GOOGLE_CSE_ID = os.getenv('GOOGLE_CSE_ID') GOOGLE_API_KEY = os.getenv('GOOGLE_API_KEY') LLM_MODEL = os.getenv('LLM_MODEL') set_llm_cache(SQLiteCache(database_path=".cache.db")) # Load the model from the Hugging Face Hub llm = HuggingFaceEndpoint(repo_id=LLM_MODEL, temperature=0.1, max_new_tokens=1024, repetition_penalty=1.2, return_full_text=False ) tools = [ knowledgeBase_search, google_search, #web_research, #ask_user ] prompt = PromptTemplate.from_template( template=template_system ) prompt = prompt.partial( tools=render_text_description(tools), tool_names=", ".join([t.name for t in tools]), ) # define the agent chat_model_with_stop = llm.bind(stop=["\nObservation"]) agent = ( { "input": lambda x: x["input"], "agent_scratchpad": lambda x: format_log_to_str(x["intermediate_steps"]), "chat_history": lambda x: x["chat_history"], } | prompt | chat_model_with_stop | ReActJsonSingleInputOutputParser() ) # instantiate AgentExecutor agent_executor = AgentExecutor( agent=agent, tools=tools, verbose=True, max_iterations=20, # cap number of iterations max_execution_time=90, # timout at 60 sec return_intermediate_steps=True, handle_parsing_errors=True, )