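# NOTE(review): the following text looks like page-extraction residue (hosting
# UI status), not part of the module -- confirm and drop if so:
#   Spaces: Running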
from typing import Any
# Identifiers of the OpenAI `text-*` models known to this module.
# Chat-style model names live in CHAT_OPENAI_MODELS instead.
OPENAI_MODELS: list[str] = [
    "text-davinci-003",
    "text-davinci-002",
    "text-curie-001",
    "text-babbage-001",
    "text-ada-001",
]
# Identifiers of the OpenAI `gpt-*` models known to this module.
# Order is preserved from the original list; the first entry is "gpt-4o".
CHAT_OPENAI_MODELS: list[str] = [
    "gpt-4o",
    "gpt-4-turbo-preview",
    "gpt-4-0125-preview",
    "gpt-4-1106-preview",
    "gpt-4-vision-preview",
    "gpt-3.5-turbo-0125",
    "gpt-3.5-turbo-1106",
]
# Identifiers of the Anthropic models known to this module. The per-entry
# comments carry the model descriptions that accompanied the original list.
ANTHROPIC_MODELS: list[str] = [
    # Largest model, ideal for a wide range of more complex tasks.
    "claude-v1",
    # An enhanced version of claude-v1 with a 100,000 token (roughly 75,000
    # word) context window.
    "claude-v1-100k",
    # A smaller model with far lower latency, sampling at roughly 40 words/sec.
    "claude-instant-v1",
    # Like claude-instant-v1, with a 100,000 token context window, while
    # retaining its performance.
    "claude-instant-v1-100k",
    # --- Specific sub-versions of the above models ---
    # Compared with claude-v1.2: better instruction-following, code, and
    # non-English dialogue and writing.
    "claude-v1.3",
    # An enhanced version of claude-v1.3 with a 100,000 token (roughly 75,000
    # word) context window.
    "claude-v1.3-100k",
    # Compared with claude-v1.1: small advantage in general helpfulness,
    # instruction following, coding, and other tasks.
    "claude-v1.2",
    # An earlier version of claude-v1.
    "claude-v1.0",
    # Latest version of claude-instant-v1. Better than claude-instant-v1.0 at
    # most tasks.
    "claude-instant-v1.1",
    # Version of claude-instant-v1.1 with a 100K token context window.
    "claude-instant-v1.1-100k",
    # An earlier version of claude-instant-v1.
    "claude-instant-v1.0",
]
# Source text of a default `python_function` that returns its input unchanged.
# The body must stay indented inside the string: the text is Python source,
# and an unindented body would make it fail to compile.
DEFAULT_PYTHON_FUNCTION = """
def python_function(text: str) -> str:
    \"\"\"This is a default python function that returns the input text\"\"\"
    return text
"""
# Built-in type objects (the classes themselves, not their names) that this
# module groups as "basic" Python types.
PYTHON_BASIC_TYPES: list[type] = [str, bool, int, float, tuple, list, dict, set]
# Type names, as strings, that this module groups as "direct" types. The list
# mixes Python type names ("str", "int", ...) with names such as "prompt",
# "code", "NestedDict" and "table".
# NOTE(review): how consumers interpret these names is not visible here --
# confirm against the callers before adding or renaming entries.
DIRECT_TYPES: list[str] = [
    "str",
    "bool",
    "dict",
    "int",
    "float",
    "Any",
    "prompt",
    "code",
    "NestedDict",
    "table",
]
# Catalogue of document loaders. Each entry is a dict with:
#   "loader"      - loader class name (the last component of "import")
#   "name"        - human-readable label including the file extension(s)
#   "import"      - dotted path of the loader class
#   "defaultFor"  - optional; extensions for which this entry is listed as the
#                   default (absent on BSHTMLLoader and FacebookChatLoader,
#                   whose extensions already have another default entry)
#   "allowdTypes" - extensions the entry accepts
# NOTE: the key "allowdTypes" is misspelled, but it is kept as is because code
# outside this block reads it under that exact name.
LOADERS_INFO: list[dict[str, Any]] = [
    {
        "loader": "AirbyteJSONLoader",
        "name": "Airbyte JSON (.jsonl)",
        "import": "langchain_community.document_loaders.AirbyteJSONLoader",
        "defaultFor": ["jsonl"],
        "allowdTypes": ["jsonl"],
    },
    {
        "loader": "JSONLoader",
        "name": "JSON (.json)",
        "import": "langchain_community.document_loaders.JSONLoader",
        "defaultFor": ["json"],
        "allowdTypes": ["json"],
    },
    {
        "loader": "BSHTMLLoader",
        "name": "BeautifulSoup4 HTML (.html, .htm)",
        "import": "langchain_community.document_loaders.BSHTMLLoader",
        "allowdTypes": ["html", "htm"],
    },
    {
        "loader": "CSVLoader",
        "name": "CSV (.csv)",
        "import": "langchain_community.document_loaders.CSVLoader",
        "defaultFor": ["csv"],
        "allowdTypes": ["csv"],
    },
    {
        "loader": "CoNLLULoader",
        "name": "CoNLL-U (.conllu)",
        "import": "langchain_community.document_loaders.CoNLLULoader",
        "defaultFor": ["conllu"],
        "allowdTypes": ["conllu"],
    },
    {
        "loader": "EverNoteLoader",
        "name": "EverNote (.enex)",
        "import": "langchain_community.document_loaders.EverNoteLoader",
        "defaultFor": ["enex"],
        "allowdTypes": ["enex"],
    },
    {
        "loader": "FacebookChatLoader",
        "name": "Facebook Chat (.json)",
        "import": "langchain_community.document_loaders.FacebookChatLoader",
        "allowdTypes": ["json"],
    },
    {
        "loader": "OutlookMessageLoader",
        "name": "Outlook Message (.msg)",
        "import": "langchain_community.document_loaders.OutlookMessageLoader",
        "defaultFor": ["msg"],
        "allowdTypes": ["msg"],
    },
    {
        "loader": "PyPDFLoader",
        "name": "PyPDF (.pdf)",
        "import": "langchain_community.document_loaders.PyPDFLoader",
        "defaultFor": ["pdf"],
        "allowdTypes": ["pdf"],
    },
    {
        # Fixed: this entry previously named "STRLoader" and the ".str"
        # extension. The subtitle loader class is SRTLoader and the format is
        # ".srt". The old "str" extension stays listed so that inputs matched
        # before this fix are still matched.
        "loader": "SRTLoader",
        "name": "Subtitle (.srt)",
        "import": "langchain_community.document_loaders.SRTLoader",
        "defaultFor": ["srt", "str"],
        "allowdTypes": ["srt", "str"],
    },
    {
        "loader": "TextLoader",
        "name": "Text (.txt)",
        "import": "langchain_community.document_loaders.TextLoader",
        "defaultFor": ["txt"],
        "allowdTypes": ["txt"],
    },
    {
        "loader": "UnstructuredEmailLoader",
        "name": "Unstructured Email (.eml)",
        "import": "langchain_community.document_loaders.UnstructuredEmailLoader",
        "defaultFor": ["eml"],
        "allowdTypes": ["eml"],
    },
    {
        "loader": "UnstructuredHTMLLoader",
        "name": "Unstructured HTML (.html, .htm)",
        "import": "langchain_community.document_loaders.UnstructuredHTMLLoader",
        "defaultFor": ["html", "htm"],
        "allowdTypes": ["html", "htm"],
    },
    {
        "loader": "UnstructuredMarkdownLoader",
        "name": "Unstructured Markdown (.md)",
        "import": "langchain_community.document_loaders.UnstructuredMarkdownLoader",
        "defaultFor": ["md", "mdx"],
        "allowdTypes": ["md", "mdx"],
    },
    {
        "loader": "UnstructuredPowerPointLoader",
        "name": "Unstructured PowerPoint (.pptx)",
        "import": "langchain_community.document_loaders.UnstructuredPowerPointLoader",
        "defaultFor": ["pptx"],
        "allowdTypes": ["pptx"],
    },
    {
        "loader": "UnstructuredWordLoader",
        "name": "Unstructured Word (.docx)",
        "import": "langchain_community.document_loaders.UnstructuredWordLoader",
        "defaultFor": ["docx"],
        "allowdTypes": ["docx"],
    },
]
# Sender identifiers and sender names for the two message parties.
# NOTE(review): presumably MESSAGE_SENDER_* is the stored sender value and
# MESSAGE_SENDER_NAME_* the label shown for it -- confirm against callers.
# The AI party uses different strings for the two ("Machine" vs "AI").
MESSAGE_SENDER_AI = "Machine"
MESSAGE_SENDER_USER = "User"
MESSAGE_SENDER_NAME_AI = "AI"
MESSAGE_SENDER_NAME_USER = "User"
# Upper bound on text length.
# NOTE(review): the unit (characters vs. tokens) and where the limit is
# enforced are not visible in this module -- confirm against callers.
MAX_TEXT_LENGTH = 99_999