Update private_gpt/components/llm/llm_component.py
private_gpt/components/llm/llm_component.py
CHANGED
@@ -1,6 +1,5 @@
 import logging
-
-
+import os
 from injector import inject, singleton
 from llama_index.llms import MockLLM
 from llama_index.llms.base import LLM
@@ -11,27 +10,19 @@ from private_gpt.components.llm.prompt_helper import get_prompt_style
 from private_gpt.paths import models_path
 from private_gpt.settings.settings import Settings
 
-import os
 logger = logging.getLogger(__name__)
 
-model_url: "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/raw/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf"
-
 @singleton
 class LLMComponent:
     llm: LLM
 
     @inject
-    def __init__(self, settings: Settings
-        llm_mode =
+    def __init__(self, settings: Settings) -> None:
+        llm_mode = settings.llm.mode
         logger.info("Initializing the LLM in mode=%s", llm_mode)
 
-        allowed_modes = ["local", "openai", "sagemaker", "mock"]
-
-        if llm_mode not in allowed_modes:
-            raise ValueError(f"Invalid LLM mode: {llm_mode}")
-
 
-        match
+        match settings.llm.mode:
             case "local":
                 from llama_index.llms import LlamaCPP
                 prompt_style_cls = get_prompt_style(settings.local.prompt_style)
@@ -39,8 +30,7 @@ class LLMComponent:
                     default_system_prompt=settings.local.default_system_prompt
                 )
                 self.llm = LlamaCPP(
-
-                    model_url= "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/resolve/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf?download=true",
+                    model_path=str(models_path / settings.local.llm_hf_model_file),
                     temperature=0.1,
                     max_new_tokens=settings.llm.max_new_tokens,
                     context_window=3900,
@@ -61,42 +51,45 @@ class LLMComponent:
 
                 #default startup
                 logger.info("Initializing the GPT Model in=%s", "gpt-3.5-turbo")
-                self.llm = OpenAI(model="gpt-3.5-turbo", api_key=
-
-            case "mock":
-                self.llm = MockLLM()
-
+                self.llm = OpenAI(model="gpt-3.5-turbo", api_key=openai_settings)
 
             case "dynamic":
-
-
-
-
-
+                from llama_index.llms import OpenAI
+                openai_settings = settings.openai.api_key
 
+                #default startup
+                logger.info("Initializing the GPT Model in=%s", "gpt-3.5-turbo")
+                self.llm = OpenAI(model="gpt-3.5-turbo", api_key=openai_settings)
+
+            case "mock":
+                self.llm = MockLLM()
 
+    @inject
     def switch_model(self, new_model: str, settings: Settings) -> None:
+        from llama_index.llms import LlamaCPP
         openai_settings = settings.openai.api_key
 
+
        if new_model == "gpt-3.5-turbo":
-            self.llm = OpenAI(model="gpt-3.5-turbo", api_key=
-
+            self.llm = OpenAI(model="gpt-3.5-turbo", api_key=openai_settings)
+
 
        elif new_model == "gpt-4":
            # Initialize with the new model
-            self.llm = OpenAI(model="gpt-4", api_key=
-            logger.info("Initializing the
+            self.llm = OpenAI(model="gpt-4", api_key=openai_settings)
+            logger.info("Initializing the GPT Model in=%s", "gpt-4")
 
 
        elif new_model == "mistral-7B":
-
+            model_url= "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/resolve/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf?download=true"
+            #model_filename = os.path.basename(model_url)
            prompt_style_cls = get_prompt_style(settings.local.prompt_style)
            prompt_style = prompt_style_cls(
                default_system_prompt=settings.local.default_system_prompt
            )
            self.llm = LlamaCPP(
-
-                model_url=
+                model_path=str(models_path / settings.local.llm_hf_model_file),
+                #model_url= model_filename,
                temperature=0.1,
                max_new_tokens=settings.llm.max_new_tokens,
                context_window=3900,
@@ -106,15 +99,6 @@ class LLMComponent:
                completion_to_prompt=prompt_style.completion_to_prompt,
                verbose=True,
            )
-            logger.info("Initializing the LLM Model in=%s", "Mistral-7B")
-
-            return self
-
-
-
-
-
-
 
 
 
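For reference, the rewritten `local` and `mistral-7B` branches now load weights from `model_path=str(models_path / settings.local.llm_hf_model_file)` rather than streaming from `model_url`, so the GGUF file must already exist under `models_path`. A minimal sketch of driving the new `switch_model` hook follows. It is illustrative only: it assumes privateGPT's stock DI wiring (`private_gpt.di.global_injector`), its `settings()` accessor, and the Mistral filename implied by the commented-out URL above; none of these are guaranteed by this commit.

# Sketch only: pre-fetch the GGUF weights, then drive the new switch_model() hook.
# Names not shown in the diff (global_injector, settings(), the repo/filename)
# are assumptions about the surrounding privateGPT setup.
from huggingface_hub import hf_hub_download

from private_gpt.components.llm.llm_component import LLMComponent
from private_gpt.di import global_injector
from private_gpt.paths import models_path
from private_gpt.settings.settings import settings

# switch_model("mistral-7B") builds LlamaCPP from model_path, so the file must
# already be on disk; download it once into models_path.
hf_hub_download(
    repo_id="TheBloke/Mistral-7B-Instruct-v0.1-GGUF",
    filename="mistral-7b-instruct-v0.1.Q4_K_M.gguf",
    local_dir=models_path,
)

llm_component = global_injector.get(LLMComponent)  # singleton, built once at startup
llm_component.switch_model("mistral-7B", settings=settings())

Note that as committed, `switch_model` imports only `LlamaCPP`; its `gpt-3.5-turbo` and `gpt-4` branches reference `OpenAI`, which is imported only inside `__init__`'s case arms, so a standalone caller may also need `from llama_index.llms import OpenAI`.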