# app.py — Hugging Face Space "API" by Reality123b (commit 9d0ab74, verified; 7.21 kB)
import gradio as gr
from huggingface_hub import InferenceClient
from deep_translator import GoogleTranslator
from indic_transliteration import sanscript
from indic_transliteration.detect import detect as detect_script
from indic_transliteration.sanscript import transliterate
import langdetect
import re
import requests
import json
import base64
from PIL import Image
import io
import time
# Initialize clients
# Text-generation backend: Zephyr-7B served via the HF Inference API.
text_client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
# Base URL of the DALLE-4K Space used for image generation.
SPACE_URL = "https://ijohn07-dalle-4k.hf.space"
# Add image style options
# UI label -> value passed to generate_image_space; "(No style)" is the
# sentinel that leaves the prompt unmodified.
IMAGE_STYLES = {
    "3840 x 2160": "3840 x 2160",
    "2560 x 1440": "2560 x 1440",
    "Photo": "Photo",
    "Cinematic": "Cinematic",
    "Anime": "Anime",
    "3D Model": "3D Model",
    "No style": "(No style)"
}
def generate_image_space(prompt: str, style: str) -> Image.Image:
    """Generate an image using the DALLE-4K Space with the specified style.

    Args:
        prompt: Text description of the desired image.
        style: One of IMAGE_STYLES' values; "(No style)" leaves the prompt
            untouched.

    Returns:
        A PIL Image on success, or None on any failure (network error,
        generation error, or timeout) — callers treat None as "failed".
    """
    # Upper bound on polling so a stuck queue can't hang the caller forever
    # (the original `while True` loop had no exit if the Space never replied).
    max_polls = 120  # ~2 minutes at 1s per poll
    try:
        # Join the Space's queue to obtain a session hash for this request.
        # NOTE(review): endpoint shape assumed from the original code — the
        # Space's queue API is not documented here; confirm against the Space.
        response = requests.post(f"{SPACE_URL}/queue/join", timeout=30)
        session_hash = response.json().get('session_hash')

        # Fold the selected style into the prompt text.
        if style != "(No style)":
            if style in ["3840 x 2160", "2560 x 1440"]:
                # Resolution styles are expressed as a target resolution.
                prompt = f"{prompt}, {style} resolution"
            else:
                # Other styles are appended as a lower-case style tag.
                prompt = f"{prompt}, {style.lower()} style"

        # Send the generation request with the Space's expected parameters.
        requests.post(f"{SPACE_URL}/run/predict", json={
            "data": [
                prompt,              # Prompt with style folded in
                "",                  # Negative prompt
                7.5,                 # Guidance scale
                30,                  # Steps
                "DPM++ SDE Karras",  # Scheduler
                False,               # High resolution
                False,               # Image to image
                None,                # Image upload
                1                    # Batch size
            ],
            "session_hash": session_hash
        }, timeout=30)

        # Poll for results, but never more than max_polls times.
        for _ in range(max_polls):
            status_response = requests.post(
                f"{SPACE_URL}/queue/status",
                json={"session_hash": session_hash},
                timeout=30,
            )
            status_data = status_response.json()
            status = status_data.get('status')
            if status == 'complete':
                # The image arrives as a base64 data URI: strip the
                # "data:...;base64," header and decode the remainder.
                image_data = status_data['data']['image']
                image_bytes = base64.b64decode(image_data.split(',')[1])
                return Image.open(io.BytesIO(image_bytes))
            elif status == 'error':
                raise Exception(f"Image generation failed: {status_data.get('error')}")
            time.sleep(1)  # Wait before polling again
        raise Exception("Image generation timed out while polling the queue")
    except Exception as e:
        # Preserve the original contract: log and signal failure with None.
        print(f"Image generation error: {e}")
        return None
def romanized_to_bengali(text: str) -> str:
    """Convert romanized Bengali text to Bengali script.

    Known words are replaced via a small dictionary. If no dictionary word
    matched at all, fall back to generic ITRANS transliteration; if that too
    fails, return the input unchanged.

    Args:
        text: Possibly romanized Bengali input.

    Returns:
        Text with known words rendered in Bengali script (lower-cased as a
        side effect of the matching), a full transliteration, or the
        original text.
    """
    bengali_mappings = {
        'ami': 'আমি',
        'tumi': 'তুমি',
        'apni': 'আপনি',
        'kemon': 'কেমন',
        'achen': 'আছেন',
        'acchen': 'আছেন',
        'bhalo': 'ভালো',
        'achi': 'আছি',
        'ki': 'কি',
        'kothay': 'কোথায়',
        'keno': 'কেন',
    }
    text_lower = text.lower()
    for roman, bengali in bengali_mappings.items():
        # \b keeps e.g. 'ami' from matching inside 'amish'; re.escape guards
        # against any future mapping key containing regex metacharacters.
        text_lower = re.sub(r'\b' + re.escape(roman) + r'\b', bengali, text_lower)
    if text_lower == text.lower():
        # No dictionary word matched; try generic transliteration instead.
        try:
            return transliterate(text, sanscript.ITRANS, sanscript.BENGALI)
        except Exception:
            # Transliteration can fail on mixed/invalid input (was a bare
            # `except:`, which also swallowed KeyboardInterrupt/SystemExit).
            return text
    return text_lower
def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
    image_style: str,  # Style selector value from the UI radio group
):
    """Chat handler: canned replies, image requests, else translated LLM chat.

    Yields either a plain string reply or an (image, caption) tuple for
    image-generation requests.
    """
    # First check for custom responses — they take precedence over everything.
    custom_response = check_custom_responses(message)
    if custom_response:
        yield custom_response
        return

    # Check if this is an image generation request.
    if is_image_request(message):
        try:
            image = generate_image_space(message, image_style)
            if image:
                style_info = f" using {image_style} style" if image_style != "(No style)" else ""
                yield (image, f"Here's your generated image based on: {message}{style_info}")
                return
            else:
                yield "Sorry, I couldn't generate the image. Please try again."
                return
        except Exception as e:
            yield f"An error occurred while generating the image: {str(e)}"
            return

    # Text-chat branch: translate the user's message to English for the model.
    translated_msg, original_lang, was_transliterated = translate_text(message)
    messages = [{"role": "system", "content": system_message}]
    for user_msg, assistant_msg in history:
        if user_msg:
            # Only translate longer user turns; short ones go through verbatim.
            if len(user_msg.split()) > 2:
                trans_user_msg, _, _ = translate_text(user_msg)
                messages.append({"role": "user", "content": trans_user_msg})
            else:
                messages.append({"role": "user", "content": user_msg})
        if assistant_msg:
            messages.append({"role": "assistant", "content": assistant_msg})
    messages.append({"role": "user", "content": translated_msg})

    response = ""
    # BUG FIX: the original loop reused the name `message` for each stream
    # chunk, clobbering the user's message so the len(message.split()) check
    # below ran on a stream-chunk object. Use a distinct name.
    for chunk in text_client.chat_completion(
        messages,
        max_tokens=max_tokens,
        stream=True,
        temperature=temperature,
        top_p=top_p,
    ):
        token = chunk.choices[0].delta.content
        if token:  # the final stream chunk may carry None content
            response += token

    # Translate the reply back only for longer non-English messages.
    if original_lang != 'en' and len(message.split()) > 2:
        try:
            translator = GoogleTranslator(source='en', target=original_lang)
            yield translator.translate(response)
        except Exception:
            # Best-effort: fall back to the English response on any failure.
            yield response
    else:
        yield response
# Updated Gradio interface with image style selector
# Wires `respond` to a chat box plus the extra controls (system prompt,
# sampling parameters, and the image-style radio group), in the order
# respond() expects its additional parameters.
demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        # Default system prompt; user-editable in the UI.
        gr.Textbox(
            value="You are a friendly Chatbot who always responds in English unless the user specifically uses another language.",
            label="System message"
        ),
        gr.Slider(
            minimum=1,
            maximum=2048,
            value=2048,
            step=1,
            label="Max new tokens"
        ),
        gr.Slider(
            minimum=0.1,
            maximum=4.0,
            value=0.7,
            step=0.1,
            label="Temperature"
        ),
        gr.Slider(
            minimum=0.1,
            maximum=1.0,
            value=0.95,
            step=0.05,
            label="Top-p (nucleus sampling)"
        ),
        # Style choices come from IMAGE_STYLES; "(No style)" disables styling.
        gr.Radio(
            choices=list(IMAGE_STYLES.values()),
            value="3840 x 2160",
            label="Image Style",
            info="Select the style for generated images"
        ),
    ]
)

if __name__ == "__main__":
    # share=True publishes a temporary public Gradio link.
    demo.launch(share=True)