Update private_gpt/components/llm/llm_component.py
private_gpt/components/llm/llm_component.py
CHANGED
@@ -3,16 +3,15 @@ import logging
 from injector import inject, singleton
 from llama_index.llms import MockLLM
 from llama_index.llms.base import LLM
+from fastapi import Depends
+from llama_index.llms import OpenAI
 
 from private_gpt.components.llm.prompt_helper import get_prompt_style
 from private_gpt.paths import models_path
 from private_gpt.settings.settings import Settings
 
-import os
-
 logger = logging.getLogger(__name__)
 
-
 @singleton
 class LLMComponent:
     llm: LLM
@@ -21,43 +20,52 @@ class LLMComponent:
     def __init__(self, settings: Settings) -> None:
         llm_mode = settings.llm.mode
         logger.info("Initializing the LLM in mode=%s", llm_mode)
+
+
         match settings.llm.mode:
             case "local":
                 from llama_index.llms import LlamaCPP
-
                 prompt_style_cls = get_prompt_style(settings.local.prompt_style)
                 prompt_style = prompt_style_cls(
                     default_system_prompt=settings.local.default_system_prompt
                 )
-
                 self.llm = LlamaCPP(
                     model_path=str(models_path / settings.local.llm_hf_model_file),
                     temperature=0.1,
                     max_new_tokens=settings.llm.max_new_tokens,
-                    # llama2 has a context window of 4096 tokens,
-                    # but we set it lower to allow for some wiggle room
                     context_window=3900,
                     generate_kwargs={},
-                    # All to GPU
                     model_kwargs={"n_gpu_layers": -1},
-                    # transform inputs into Llama2 format
                     messages_to_prompt=prompt_style.messages_to_prompt,
                     completion_to_prompt=prompt_style.completion_to_prompt,
                     verbose=True,
                 )
-
             case "sagemaker":
                 from private_gpt.components.llm.custom.sagemaker import SagemakerLLM
-
                 self.llm = SagemakerLLM(
                     endpoint_name=settings.sagemaker.llm_endpoint_name,
                 )
             case "openai":
                 from llama_index.llms import OpenAI
+                openai_settings = settings.openai.api_key
 
-                openai_settings = settings.openai.api_key
-                self.llm = OpenAI(api_key=openai_settings)
+                #default startup
+                logger.info("Initializing the GPT Model in=%s", "gpt-3.5-turbo")
+                self.llm = OpenAI(model="gpt-3.5-turbo", api_key=openai_settings)
+
             case "mock":
                 self.llm = MockLLM()
 
+    @inject
+    def switch_model(self, new_model: str, settings: Settings) -> None:
+        openai_settings = settings.openai.api_key
+        if type(self.llm) == OpenAI:
+            if new_model == "gpt-3.5-turbo":
+                self.llm = OpenAI(model="gpt-3.5-turbo", api_key=openai_settings)
+            elif new_model == "gpt-4":
+                # Initialize with the new model
+                self.llm = OpenAI(model="gpt-4", api_key=openai_settings)
+                logger.info("Initializing the GPT Model in=%s", "gpt-4")
+
+
 
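For reference, a minimal usage sketch of the new switch_model method. This is a sketch only: it assumes a Settings instance configured with llm.mode "openai" and a valid settings.openai.api_key; the demo wrapper function is illustrative and not part of this commit.

    from private_gpt.components.llm.llm_component import LLMComponent
    from private_gpt.settings.settings import Settings

    def demo(settings: Settings) -> None:
        # Constructed in "openai" mode, the component starts on gpt-3.5-turbo.
        component = LLMComponent(settings)
        # Swap the singleton's underlying LLM to gpt-4, then back again.
        component.switch_model("gpt-4", settings)
        component.switch_model("gpt-3.5-turbo", settings)

Note that switch_model only takes effect when the component was initialized in "openai" mode, since it first checks that self.llm is an OpenAI instance; in "local", "sagemaker", and "mock" modes the call is a no-op.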