# enterprise/enterprise_callbacks/generic_api_callback.py
#### What this does ####
# On success, sends the logged event as a POST request to a
# user-configured API endpoint
import json
import os
import traceback
import uuid
from typing import Optional

import litellm
from litellm._logging import print_verbose, verbose_logger


class GenericAPILogger:
    def __init__(self, endpoint: Optional[str] = None, headers: Optional[dict] = None):
        try:
            if endpoint is None:
                # fall back to the GENERIC_LOGGER_ENDPOINT environment variable
                if os.getenv("GENERIC_LOGGER_ENDPOINT"):
                    endpoint = os.getenv("GENERIC_LOGGER_ENDPOINT")
                else:
                    raise ValueError(
                        "endpoint not set for GenericAPILogger, GENERIC_LOGGER_ENDPOINT not found in environment variables"
                    )
            headers = headers or litellm.generic_logger_headers
            if endpoint is None:
                raise ValueError("endpoint not set for GenericAPILogger")
            if headers is None:
                raise ValueError("headers not set for GenericAPILogger")
            self.endpoint = endpoint
            self.headers = headers
            verbose_logger.debug(
                f"in init GenericAPILogger, endpoint {self.endpoint}, headers {self.headers}"
            )
        except Exception as e:
            print_verbose(f"Got exception on init GenericAPILogger client {str(e)}")
            raise e
    # This is sync, because we run this in a separate thread. Running in a
    # separate thread ensures it will never block an LLM API call.
    # Experience with s3 and Langfuse shows that async logging events are
    # complicated and can block LLM calls.
    def log_event(
        self, kwargs, response_obj, start_time, end_time, user_id, print_verbose
    ):
        try:
            verbose_logger.debug(
                f"GenericAPILogger Logging - Enters logging function for model {kwargs}"
            )

            # construct the payload to send to the custom logger;
            # follows the same params as langfuse.py
            litellm_params = kwargs.get("litellm_params", {})
            metadata = (
                litellm_params.get("metadata", {}) or {}
            )  # litellm_params["metadata"] can be None
            messages = kwargs.get("messages")
            cost = kwargs.get("response_cost", 0.0)
            optional_params = kwargs.get("optional_params", {})
            call_type = kwargs.get("call_type", "litellm.completion")
            cache_hit = kwargs.get("cache_hit", False)
            usage = response_obj["usage"]
            response_id = response_obj.get("id", str(uuid.uuid4()))
            # Build the initial payload
            payload = {
                "id": response_id,
                "call_type": call_type,
                "cache_hit": cache_hit,
                "startTime": start_time,
                "endTime": end_time,
                "model": kwargs.get("model", ""),
                "user": kwargs.get("user", ""),
                "modelParameters": optional_params,
                "messages": messages,
                "response": response_obj,
                "usage": usage,
                "metadata": metadata,
                "cost": cost,
            }
            # Ensure every value in the payload is converted to a str
            for key, value in payload.items():
                try:
                    payload[key] = str(value)
                except Exception:
                    # non-blocking if a value can't be cast to a str
                    pass
            data = {
                "data": payload,
            }
            print_verbose(f"\nGeneric Logger - Logging payload = {json.dumps(data)}")

            # make the request to the endpoint; pass the dict via `json=` so
            # the client serializes the body exactly once
            response = litellm.module_level_client.post(
                self.endpoint, json=data, headers=self.headers
            )
            response_status = response.status_code
            response_text = response.text
            print_verbose(
                f"Generic Logger - final response status = {response_status}, response text = {response_text}"
            )
            return response
        except Exception as e:
            # non-blocking: log the failure instead of raising into the caller
            verbose_logger.error(f"Generic - {str(e)}\n{traceback.format_exc()}")
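

# Minimal usage sketch. The endpoint URL, bearer token, and payload values
# below are hypothetical placeholders, not part of the library; if nothing is
# listening at the endpoint, the POST fails and log_event logs the error
# instead of raising.
if __name__ == "__main__":
    import datetime

    os.environ["GENERIC_LOGGER_ENDPOINT"] = "http://localhost:8000/log"  # hypothetical
    logger = GenericAPILogger(headers={"Authorization": "Bearer my-token"})  # hypothetical token

    now = datetime.datetime.now()
    logger.log_event(
        kwargs={
            "model": "gpt-3.5-turbo",
            "messages": [{"role": "user", "content": "hi"}],
            "litellm_params": {"metadata": {"user_api_key": "hashed-key"}},
            "response_cost": 0.0001,
        },
        response_obj={
            "id": "chatcmpl-123",
            "usage": {"prompt_tokens": 1, "completion_tokens": 1, "total_tokens": 2},
        },
        start_time=now,
        end_time=now,
        user_id="user-1",
        print_verbose=print_verbose,
    )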