# Endpoint settings for the chat model and the embedding model.
# NOTE(review): the nesting below was reconstructed from a file that had been
# collapsed onto a single line — confirm it against the consuming tool's schema.

# Chat-completion model settings.
llm:
  # NOTE(review): this credential is stored in plain text. If the consuming
  # tool supports environment-variable substitution, reference it from the
  # environment instead of committing it.
  api_key: "3bf18984-b4df-49ba-a30b-6cbae3964b08"
  type: openai_chat
  model_supports_json: true
  model: "claude-3-5-sonnet-20240620"
  # Requests go to a server on localhost rather than to a hosted API.
  api_base: "http://localhost:30012/v1"
  # Disabled setting, kept for reference.
  # NOTE(review): the original remark said this value was adjusted for
  # Claude 3 Haiku's context window, but the model configured above is
  # Claude 3.5 Sonnet — re-check the value before enabling it.
  # max_tokens: 10000
  # presumably seconds — TODO confirm the unit with the consumer
  request_timeout: 30
  # Rate limits applied to this endpoint.
  tokens_per_minute: 100000
  requests_per_minute: 1000
  # presumably seconds — TODO confirm the unit with the consumer
  max_retry_wait: 5
  temperature: 0.1

# Embedding model settings.
embeddings:
  async_mode: threaded
  llm:
    type: openai_embedding
    model: "mixedbread-ai/mxbai-embed-large-v1"
    # Embedding requests also go to a server on localhost.
    api_base: "http://localhost:7997"