Spaces:

lynx-analytics
/

lynxkite

Running

App Files Community

darabos committed on Oct 9, 2024

Commit

0213da5

1 Parent(s): 9cc1fee

Fix caching, move outputs on top.

Browse files

Files changed (4) hide show

data/LynxScribe demo +46 -70
requirements.txt +1 -0
server/executors/one_by_one.py +14 -5
server/lynxscribe_ops.py +19 -4

data/LynxScribe demo CHANGED Viewed

@@ -56,7 +56,7 @@
               ],
               "data": [
                 [
-                  "Az élet titka sokak számára különböző lehet, és sok tényezőtől függ. Néhány kulcselem, ami segíthet megtalálni az élet értelmét vagy titkát:\n\n- **Kapcsolatok**: A barátok és a család közelsége fontos az érzelmi jólét szempontjából.\n- **Önmegvalósítás**: Mindenkinek más a célja és álma, érdemes dolgozni azon, hogy elérjük őket.\n- **Tanulás**: Folyamatosan fejlődjünk és tanuljunk, hogy jobban megértsük a világot.\n- **Egészség**: A fizikai és mentális egészség megőrzése kulcsfontosságú az életminőség szempontjából.\n- **Kibékülés**: Békélj meg a múltaddal, és tanulj meg megbocsátani önmagadnak és másoknak.\n\nEzek az elemek hozzájárulhatnak ahhoz, hogy az életet gazdagabbnak és értékesebbnek érezd. Van valami konkrét aspektus az élet titkáról, amiről szívesen beszélnél?\n\nPlease visit <a href='https://www.linkedin.com/in/g%c3%a1bor-benedek-95578717' target='_blank'>https://www.linkedin.com/in/g%c3%a1bor-benedek-95578717</a> for further information."
                 ]
               ]
             }
@@ -114,7 +114,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -122,8 +122,8 @@
         }
       },
       "position": {
-        "x": -996.3183837866898,
-        "y": 1329.9037704510513
       },
       "parentId": null
     },
@@ -163,7 +163,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -171,8 +171,8 @@
         }
       },
       "position": {
-        "x": -1076.3726648689906,
-        "y": 1126.1701539825485
       },
       "parentId": null
     },
@@ -217,7 +217,7 @@
               "type": {
                 "type": "<class 'inspect._empty'>"
               },
-              "position": "left"
             }
           },
           "outputs": {
@@ -226,7 +226,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -234,7 +234,7 @@
         }
       },
       "position": {
-        "x": -57.80584961387282,
         "y": 235.19823621492515
       },
       "parentId": null
@@ -283,7 +283,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -291,8 +291,8 @@
         }
       },
       "position": {
-        "x": -428.0531718264389,
-        "y": 174.62875974530755
       },
       "parentId": null
     },
@@ -303,10 +303,7 @@
         "title": "RAG chatbot",
         "params": {
           "negative_answer": "I'm sorry, but the data I've been trained on does not contain any information related to your question.",
-          "min_information": 2,
-          "max_information": 3,
-          "min_summary": 2,
-          "max_summary": 3,
           "strict_limits": true,
           "max_results": 5
         },
@@ -322,32 +319,11 @@
                 "type": "<class 'str'>"
               }
             },
-            "min_information": {
-              "name": "min_information",
-              "default": 2,
-              "type": {
-                "type": "<class 'int'>"
-              }
-            },
-            "max_information": {
-              "name": "max_information",
-              "default": 3,
-              "type": {
-                "type": "<class 'int'>"
-              }
-            },
-            "min_summary": {
-              "name": "min_summary",
-              "default": 2,
               "type": {
-                "type": "<class 'int'>"
-              }
-            },
-            "max_summary": {
-              "name": "max_summary",
-              "default": 3,
-              "type": {
-                "type": "<class 'int'>"
               }
             },
             "strict_limits": {
@@ -394,7 +370,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -403,12 +379,12 @@
         "beingResized": false
       },
       "position": {
-        "x": -647.9563055161224,
-        "y": 528.5816378646354
       },
       "parentId": null,
-      "width": 417,
-      "height": 494
     },
     {
       "id": "RAG graph 1",
@@ -443,7 +419,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -451,8 +427,8 @@
         }
       },
       "position": {
-        "x": -1018.3991667849547,
-        "y": 882.7108232430365
       },
       "parentId": null
     },
@@ -492,7 +468,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -501,8 +477,8 @@
         "beingResized": false
       },
       "position": {
-        "x": -1992.8382657219915,
-        "y": 898.0883240074281
       },
       "parentId": null,
       "width": 275,
@@ -544,7 +520,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -552,8 +528,8 @@
         }
       },
       "position": {
-        "x": -1601.7383061140106,
-        "y": 1187.790118541483
       },
       "parentId": null
     },
@@ -585,7 +561,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -593,8 +569,8 @@
         }
       },
       "position": {
-        "x": -1830.5553990810897,
-        "y": 1406.239623213993
       },
       "parentId": null
     },
@@ -634,7 +610,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -642,8 +618,8 @@
         }
       },
       "position": {
-        "x": -206.839661001107,
-        "y": 954.055575798662
       },
       "parentId": null
     },
@@ -664,7 +640,7 @@
               "type": {
                 "type": "<class 'inspect._empty'>"
               },
-              "position": "left"
             }
           },
           "outputs": {
@@ -673,7 +649,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -784,7 +760,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -792,8 +768,8 @@
         }
       },
       "position": {
-        "x": -202.83662881345157,
-        "y": 1123.8190429357237
       },
       "parentId": null
     },
@@ -849,7 +825,7 @@
               "type": {
                 "type": "None"
               },
-              "position": "right"
             }
           },
           "type": "basic",
@@ -857,8 +833,8 @@
         }
       },
       "position": {
-        "x": -192.5486444668937,
-        "y": 1414.696184081429
       },
       "parentId": null
     }

               ],
               "data": [
                 [
+                  "Az élet titka sok ember számára különböző lehet, és sok tényezőtől függ, mint például a személyes értékek, tapasztalatok és célok. Néhány általános gondolat az élet titkairól:\n\n- **Kapcsolatok**: A szeretet és az emberi kapcsolatok nagyon fontosak, hiszen ezek adhatják az élet értelmét.\n- **Önmegvalósítás**: Az, hogy megtaláljuk a szenvedélyeinket és céljainkat, segíthet abban, hogy boldogan éljünk.\n- **Folyamatos tanulás**: Az élet folyamatos tanulás, amely segít fejlődni és alkalmazkodni a változásokhoz.\n- **Egészség**: A fizikai és mentális egészség megőrzése alapvető az életminőség szempontjából.\n\nEzek persze csak általános nézőpontok, és mindenki másképp találhatja meg a saját életének a titkát. Te mivel kapcsolatban keresed az élet titkát?\n\nPlease visit <a href='https://www.linkedin.com/in/g%c3%a1bor-benedek-95578717' target='_blank'>https://www.linkedin.com/in/g%c3%a1bor-benedek-95578717</a> for further information."
                 ]
               ]
             }
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": -312.5774211084781,
+        "y": 1093.4019527511366
       },
       "parentId": null
     },
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": -549.1300345090008,
+        "y": 1086.4852248156676
       },
       "parentId": null
     },
               "type": {
                 "type": "<class 'inspect._empty'>"
               },
+              "position": "bottom"
             }
           },
           "outputs": {
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": -46.94726514341976,
         "y": 235.19823621492515
       },
       "parentId": null
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": 382.20164582795104,
+        "y": 533.2833307141879
       },
       "parentId": null
     },
         "title": "RAG chatbot",
         "params": {
           "negative_answer": "I'm sorry, but the data I've been trained on does not contain any information related to your question.",
+          "limits_by_type": "{\"information\": [2, 3], \"summary\": [2, 3]}",
           "strict_limits": true,
           "max_results": 5
         },
                 "type": "<class 'str'>"
               }
             },
+            "limits_by_type": {
+              "name": "limits_by_type",
+              "default": "{}",
               "type": {
+                "type": "<class 'str'>"
               }
             },
             "strict_limits": {
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         "beingResized": false
       },
       "position": {
+        "x": -521.6507639530705,
+        "y": 547.294980747757
       },
       "parentId": null,
+      "width": 336,
+      "height": 349
     },
     {
       "id": "RAG graph 1",
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": -817.8208895639339,
+        "y": 1014.836542916127
       },
       "parentId": null
     },
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         "beingResized": false
       },
       "position": {
+        "x": -1053.794625339574,
+        "y": 1347.7711940497127
       },
       "parentId": null,
       "width": 275,
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": -749.98604638686,
+        "y": 1293.5978526690794
       },
       "parentId": null
     },
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": -714.2838040349482,
+        "y": 1469.7242636905507
       },
       "parentId": null
     },
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": 0.08889822620079713,
+        "y": 1044.7639853229612
       },
       "parentId": null
     },
               "type": {
                 "type": "<class 'inspect._empty'>"
               },
+              "position": "bottom"
             }
           },
           "outputs": {
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": 233.69759202223884,
+        "y": 1041.6145468043276
       },
       "parentId": null
     },
               "type": {
                 "type": "None"
               },
+              "position": "top"
             }
           },
           "type": "basic",
         }
       },
       "position": {
+        "x": 513.2761671440603,
+        "y": 1034.8547191984255
       },
       "parentId": null
     }

requirements.txt CHANGED Viewed

@@ -2,6 +2,7 @@ fastapi
 matplotlib
 networkx
 numpy
 pandas
 scipy
 uvicorn[standard]

 matplotlib
 networkx
 numpy
+orjson
 pandas
 scipy
 uvicorn[standard]

server/executors/one_by_one.py CHANGED Viewed

@@ -1,8 +1,8 @@
 from .. import ops
 from .. import workspace
-import fastapi
-import json
 import pandas as pd
 import traceback
 import inspect
 import typing
@@ -63,6 +63,15 @@ def get_stages(ws, catalog):
   stages.append(set(nodes))
   return stages
 EXECUTOR_OUTPUT_CACHE = {}
 def execute(ws, catalog, cache=None):
@@ -101,10 +110,10 @@ def execute(ws, catalog, cache=None):
           inputs = [
             batch_inputs[(n, i.name)] if i.position in 'top or bottom' else task
             for i in op.inputs.values()]
-          if cache:
-            key = json.dumps(fastapi.encoders.jsonable_encoder((inputs, params)))
             if key not in cache:
-              cache[key] = op.func(*inputs, **params)
             result = cache[key]
           else:
             result = op(*inputs, **params)

 from .. import ops
 from .. import workspace
+import orjson
 import pandas as pd
+import pydantic
 import traceback
 import inspect
 import typing
   stages.append(set(nodes))
   return stages
+def _default_serializer(obj):
+  if isinstance(obj, pydantic.BaseModel):
+    return obj.dict()
+  return {"__nonserializable__": id(obj)}
+def make_cache_key(obj):
+  return orjson.dumps(obj, default=_default_serializer)
 EXECUTOR_OUTPUT_CACHE = {}
 def execute(ws, catalog, cache=None):
           inputs = [
             batch_inputs[(n, i.name)] if i.position in 'top or bottom' else task
             for i in op.inputs.values()]
+          if cache is not None:
+            key = make_cache_key((inputs, params))
             if key not in cache:
+              cache[key] = op(*inputs, **params)
             result = cache[key]
           else:
             result = op(*inputs, **params)

server/lynxscribe_ops.py CHANGED Viewed

@@ -14,22 +14,27 @@ from lynxscribe.components.chat_api import ChatAPI, ChatAPIRequest, ChatAPIRespo
 from . import ops
 import asyncio
 from .executors import one_by_one
 ENV = 'LynxScribe'
 one_by_one.register(ENV)
 op = ops.op_registration(ENV)
 @op("Vector store")
 def vector_store(*, name='chromadb', collection_name='lynx'):
   vector_store = get_vector_store(name=name, collection_name=collection_name)
   return {'vector_store': vector_store}
 @op("LLM")
 def llm(*, name='openai'):
   llm = get_llm_engine(name=name)
   return {'llm': llm}
 @ops.input_position(llm="bottom")
 @op("Text embedder")
 def text_embedder(llm, *, model='text-embedding-ada-002'):
@@ -37,6 +42,7 @@ def text_embedder(llm, *, model='text-embedding-ada-002'):
   text_embedder = TextEmbedder(llm=llm, model=model)
   return {'text_embedder': text_embedder}
 @ops.input_position(vector_store="bottom", text_embedder="bottom")
 @op("RAG graph")
 def rag_graph(vector_store, text_embedder):
@@ -47,6 +53,7 @@ def rag_graph(vector_store, text_embedder):
     )
     return {'rag_graph': rag_graph}
 @op("Scenario selector")
 def scenario_selector(*, scenario_file: str, node_types='intent_cluster'):
   scenarios = load_config(scenario_file)
@@ -59,28 +66,31 @@ def scenario_selector(*, scenario_file: str, node_types='intent_cluster'):
 DEFAULT_NEGATIVE_ANSWER = "I'm sorry, but the data I've been trained on does not contain any information related to your question."
 @ops.input_position(rag_graph="bottom", scenario_selector="bottom", llm="bottom")
 @op("RAG chatbot")
 def rag_chatbot(
     rag_graph, scenario_selector, llm, *,
     negative_answer=DEFAULT_NEGATIVE_ANSWER,
-    min_information=2, max_information=3,
-    min_summary=2, max_summary=3,
     strict_limits=True, max_results=5):
   rag_graph = rag_graph[0]['rag_graph']
   scenario_selector = scenario_selector[0]['scenario_selector']
   llm = llm[0]['llm']
   rag_chatbot = RAGChatbot(
       rag_graph=rag_graph,
       scenario_selector=scenario_selector,
       llm=llm,
       negative_answer=negative_answer,
-      limits_by_type=dict(information=[min_information, max_information], summary=[min_summary, max_summary]),
       strict_limits=strict_limits,
       max_results=max_results,
   )
   return {'chatbot': rag_chatbot}
 @op("Chat processor")
 def chat_processor(processor, *, _ctx: one_by_one.Context):
   cfg = _ctx.last_result or {'question_processors': [], 'answer_processors': [], 'masks': []}
@@ -98,10 +108,12 @@ def chat_processor(processor, *, _ctx: one_by_one.Context):
   chat_processor = ChatProcessor(question_processors=question_processors, answer_processors=answer_processors)
   return {'chat_processor': chat_processor, **cfg}
 @op("Truncate history")
 def truncate_history(*, max_tokens=10000, language='English'):
   return {'question_processor': TruncateHistory(max_tokens=max_tokens, language=language.lower())}
 @op("Mask")
 def mask(*, name='', regex='', exceptions='', mask_pattern=''):
   exceptions = [e.strip() for e in exceptions.split(',') if e.strip()]
@@ -119,11 +131,13 @@ def test_chat_api(message, chat_api):
 def input_chat(*, chat: str):
   return {'text': chat}
-@ops.input_position(chatbot="bottom", chat_processor="bottom")
 @op("Chat API")
 def chat_api(chatbot, chat_processor, knowledge_base, *, model='gpt-4o-mini'):
   chatbot = chatbot[0]['chatbot']
   chat_processor = chat_processor[0]['chat_processor']
   c = ChatAPI(
       chatbot=chatbot,
       chat_processor=chat_processor,
@@ -134,6 +148,7 @@ def chat_api(chatbot, chat_processor, knowledge_base, *, model='gpt-4o-mini'):
     c.chatbot.scenario_selector.check_compatibility(c.chatbot.rag_graph)
   return {'chat_api': c}
 @op("Knowledge base")
 def knowledge_base(*, nodes_path='nodes.pickle', edges_path='edges.pickle', template_cluster_path='tempclusters.pickle'):
     return {'nodes_path': nodes_path, 'edges_path': edges_path, 'template_cluster_path': template_cluster_path}

 from . import ops
 import asyncio
+import json
 from .executors import one_by_one
 ENV = 'LynxScribe'
 one_by_one.register(ENV)
 op = ops.op_registration(ENV)
+output_on_top = ops.output_position(output="top")
+@output_on_top
 @op("Vector store")
 def vector_store(*, name='chromadb', collection_name='lynx'):
   vector_store = get_vector_store(name=name, collection_name=collection_name)
   return {'vector_store': vector_store}
+@output_on_top
 @op("LLM")
 def llm(*, name='openai'):
   llm = get_llm_engine(name=name)
   return {'llm': llm}
+@output_on_top
 @ops.input_position(llm="bottom")
 @op("Text embedder")
 def text_embedder(llm, *, model='text-embedding-ada-002'):
   text_embedder = TextEmbedder(llm=llm, model=model)
   return {'text_embedder': text_embedder}
+@output_on_top
 @ops.input_position(vector_store="bottom", text_embedder="bottom")
 @op("RAG graph")
 def rag_graph(vector_store, text_embedder):
     )
     return {'rag_graph': rag_graph}
+@output_on_top
 @op("Scenario selector")
 def scenario_selector(*, scenario_file: str, node_types='intent_cluster'):
   scenarios = load_config(scenario_file)
 DEFAULT_NEGATIVE_ANSWER = "I'm sorry, but the data I've been trained on does not contain any information related to your question."
+@output_on_top
 @ops.input_position(rag_graph="bottom", scenario_selector="bottom", llm="bottom")
 @op("RAG chatbot")
 def rag_chatbot(
     rag_graph, scenario_selector, llm, *,
     negative_answer=DEFAULT_NEGATIVE_ANSWER,
+    limits_by_type='{}',
     strict_limits=True, max_results=5):
   rag_graph = rag_graph[0]['rag_graph']
   scenario_selector = scenario_selector[0]['scenario_selector']
   llm = llm[0]['llm']
+  limits_by_type = json.loads(limits_by_type)
   rag_chatbot = RAGChatbot(
       rag_graph=rag_graph,
       scenario_selector=scenario_selector,
       llm=llm,
       negative_answer=negative_answer,
+      limits_by_type=limits_by_type,
       strict_limits=strict_limits,
       max_results=max_results,
   )
   return {'chatbot': rag_chatbot}
+@output_on_top
+@ops.input_position(processor="bottom")
 @op("Chat processor")
 def chat_processor(processor, *, _ctx: one_by_one.Context):
   cfg = _ctx.last_result or {'question_processors': [], 'answer_processors': [], 'masks': []}
   chat_processor = ChatProcessor(question_processors=question_processors, answer_processors=answer_processors)
   return {'chat_processor': chat_processor, **cfg}
+@output_on_top
 @op("Truncate history")
 def truncate_history(*, max_tokens=10000, language='English'):
   return {'question_processor': TruncateHistory(max_tokens=max_tokens, language=language.lower())}
+@output_on_top
 @op("Mask")
 def mask(*, name='', regex='', exceptions='', mask_pattern=''):
   exceptions = [e.strip() for e in exceptions.split(',') if e.strip()]
 def input_chat(*, chat: str):
   return {'text': chat}
+@output_on_top
+@ops.input_position(chatbot="bottom", chat_processor="bottom", knowledge_base="bottom")
 @op("Chat API")
 def chat_api(chatbot, chat_processor, knowledge_base, *, model='gpt-4o-mini'):
   chatbot = chatbot[0]['chatbot']
   chat_processor = chat_processor[0]['chat_processor']
+  knowledge_base = knowledge_base[0]
   c = ChatAPI(
       chatbot=chatbot,
       chat_processor=chat_processor,
     c.chatbot.scenario_selector.check_compatibility(c.chatbot.rag_graph)
   return {'chat_api': c}
+@output_on_top
 @op("Knowledge base")
 def knowledge_base(*, nodes_path='nodes.pickle', edges_path='edges.pickle', template_cluster_path='tempclusters.pickle'):
     return {'nodes_path': nodes_path, 'edges_path': edges_path, 'template_cluster_path': template_cluster_path}