concrete-ml-encrypted-decisiontree / play_with_endpoint.py

chore: debug

35eb1b4 over 1 year ago

3.37 kB

	import numpy as np
	import time
	import os, sys

	from pathlib import Path

	from concrete.ml.deployment import FHEModelClient

	import requests


	def to_json(python_object):
	if isinstance(python_object, bytes):
	return {"__class__": "bytes", "__value__": list(python_object)}
	raise TypeError(repr(python_object) + " is not JSON serializable")


	def from_json(python_object):
	if "__class__" in python_object:
	return bytes(python_object["__value__"])


	# TODO: put the right link `API_URL` for your entry point
	API_URL = "https://yw1dgyuig6ff5pft.us-east-1.aws.endpoints.huggingface.cloud"
	headers = {
	"Authorization": "Bearer " + os.environ.get("HF_TOKEN"),
	"Content-Type": "application/octet-stream",
	}


	def query(payload):
	response = requests.post(API_URL, headers=headers, data=payload)
	return response.json()


	path_to_model = Path("compiled_model")

	# Decision-tree in FHE
	from sklearn.datasets import fetch_openml
	from sklearn.model_selection import train_test_split
	import numpy

	features, classes = fetch_openml(data_id=44, as_frame=False, cache=True, return_X_y=True)
	classes = classes.astype(numpy.int64)

	_, X_test, _, Y_test = train_test_split(
	features,
	classes,
	test_size=0.15,
	random_state=42,
	)

	NB_SAMPLES = 2
	X_test = X_test[:NB_SAMPLES]
	Y_test = Y_test[:NB_SAMPLES]

	# Recover parameters for client side
	fhemodel_client = FHEModelClient(path_to_model)

	# Generate the keys
	fhemodel_client.generate_private_and_evaluation_keys()
	evaluation_keys = fhemodel_client.get_serialized_evaluation_keys()

	# Test the handler
	nb_good = 0
	nb_samples = len(X_test)
	verbose = False
	time_start = time.time()
	duration = 0
	is_first = True

	for i in range(nb_samples):

	# Quantize the input and encrypt it
	encrypted_inputs = fhemodel_client.quantize_encrypt_serialize(X_test[i].reshape(1, -1))

	# print(f"Size of encrypted input {sys.getsizeof(encrypted_inputs)}")
	# print(f"Size of keys {sys.getsizeof(evaluation_keys)}")

	# Prepare the payload, including the evaluation keys which are needed server side
	payload = {
	"inputs": "fake",
	# "encrypted_inputs": to_json(encrypted_inputs),
	# "evaluation_keys": to_json(evaluation_keys),
	"encrypted_inputs": encrypted_inputs,
	"evaluation_keys": evaluation_keys,
	}

	print(f"{payload=}")

	# Run the inference on HF servers
	duration -= time.time()
	print(f"Starting at {time.time()}")
	encrypted_prediction = query(payload)
	print(f"Ending at {time.time()}")
	duration += time.time()

	print(f"{encrypted_prediction=}")

	encrypted_prediction = encrypted_prediction

	if is_first:
	is_first = False
	print(f"Size of the payload: {sys.getsizeof(payload)} bytes")

	# Decrypt the result and dequantize
	prediction_proba = fhemodel_client.deserialize_decrypt_dequantize(encrypted_prediction)[0]
	prediction = np.argmax(prediction_proba)

	if verbose or True:
	print(f"for {i}-th input, {prediction=} with expected {y_test[i]}")

	# Measure accuracy
	nb_good += y_test[i] == prediction

	print(f"Accuracy on {nb_samples} samples is {nb_good * 1. / nb_samples}")
	print(f"Total time: {time.time() - time_start} seconds")
	print(f"Duration in inferences: {duration} seconds")
	print(f"Duration per inference: {duration / nb_samples} seconds")