API / app.py
Reality123b's picture
Update app.py
a28cf0e verified
raw
history blame
13.7 kB
import gradio as gr
from huggingface_hub import InferenceClient
from deep_translator import GoogleTranslator
from indic_transliteration import sanscript
from indic_transliteration.detect import detect as detect_script
from indic_transliteration.sanscript import transliterate
import langdetect
import re
# Initialize clients
text_client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
image_client = InferenceClient("SG161222/RealVisXL_V3.0")
def detect_language_script(text: str) -> tuple[str, str]:
"""Detect language and script of the input text.
Returns (language_code, script_type)"""
try:
# Use confidence threshold to avoid false detections
lang_detect = langdetect.detect_langs(text)
if lang_detect[0].prob > 0.8:
lang = lang_detect[0].lang
else:
lang = 'en' # Default to English if unsure
script = None
try:
script = detect_script(text)
except:
pass
return lang, script
except:
return 'en', None
def is_romanized_indic(text: str) -> bool:
"""Check if text appears to be romanized Indic language.
More strict pattern matching."""
bengali_patterns = [
r'\b(ami|tumi|apni)\b', # Common pronouns
r'\b(ache|achen|thako|thaken)\b', # Common verbs
r'\b(kemon|bhalo|kharap)\b', # Common adjectives
r'\b(ki|kothay|keno)\b' # Common question words
]
text_lower = text.lower()
matches = sum(1 for pattern in bengali_patterns if re.search(pattern, text_lower))
return matches >= 2 # Require at least 2 matches to consider it Bengali
def translate_text(text: str, target_lang='en') -> tuple[str, str, bool]:
"""Translate text to target language, with more conservative translation logic."""
if len(text.split()) <= 2 or text.lower() in ['hello', 'hi', 'hey']:
return text, 'en', False
original_lang, script = detect_language_script(text)
is_transliterated = False
if original_lang != 'en' and len(text.split()) > 2:
try:
translator = GoogleTranslator(source='auto', target=target_lang)
translated = translator.translate(text)
return translated, original_lang, is_transliterated
except Exception as e:
print(f"Translation error: {e}")
return text, 'en', False
if original_lang == 'en' and len(text.split()) > 2 and is_romanized_indic(text):
text = romanized_to_bengali(text)
return translate_text(text, target_lang) # Recursive call with Bengali script
return text, 'en', False
def check_custom_responses(message: str) -> str:
"""Check for specific patterns and return custom responses."""
message_lower = message.lower()
custom_responses = {
# For "what is ur name?"
"what is ur name?": "xylaria",
"what is ur Name?": "xylaria",
"what is Ur name?": "xylaria",
"what is Ur Name?": "xylaria",
"What is ur name?": "xylaria",
"What is ur Name?": "xylaria",
"What is Ur name?": "xylaria",
"What is Ur Name?": "xylaria",
"what's ur name?": "xylaria",
"what's ur Name?": "xylaria",
"what's Ur name?": "xylaria",
"what's Ur Name?": "xylaria",
"whats ur name?": "xylaria",
"whats ur Name?": "xylaria",
"whats Ur name?": "xylaria",
"whats Ur Name?": "xylaria",
"what's your name?": "xylaria",
"what's your Name?": "xylaria",
"what's Your name?": "xylaria",
"what's Your Name?": "xylaria",
"Whats ur name?": "xylaria",
"Whats ur Name?": "xylaria",
"Whats Ur name?": "xylaria",
"Whats Ur Name?": "xylaria",
"What Is Your Name?": "xylaria",
"What Is Ur Name?": "xylaria",
"What Is Your Name?": "xylaria",
"What Is Ur Name?": "xylaria",
"what is your name?": "xylaria",
"what is your Name?": "xylaria",
"what is Your name?": "xylaria",
"what is Your Name?": "xylaria",
"how many 'r' is in strawberry?": "3",
"how many 'R' is in strawberry?": "3",
"how many 'r' Is in strawberry?": "3",
"how many 'R' Is in strawberry?": "3",
"How many 'r' is in strawberry?": "3",
"How many 'R' is in strawberry?": "3",
"How Many 'r' Is In Strawberry?": "3",
"How Many 'R' Is In Strawberry?": "3",
"how many r is in strawberry?": "3",
"how many R is in strawberry?": "3",
"how many r Is in strawberry?": "3",
"how many R Is in strawberry?": "3",
"How many r is in strawberry?": "3",
"How many R is in strawberry?": "3",
"How Many R Is In Strawberry?": "3",
"how many 'r' in strawberry?": "3",
"how many r's are in strawberry?": "3",
"how many Rs are in strawberry?": "3",
"How Many R's Are In Strawberry?": "3",
"How Many Rs Are In Strawberry?": "3",
"who is your developer?": "sk md saad amin",
"who is your Developer?": "sk md saad amin",
"who is Your Developer?": "sk md saad amin",
"who is ur developer?": "sk md saad amin",
"who is ur Developer?": "sk md saad amin",
"who is Your Developer?": "sk md saad amin",
"Who is ur developer?": "sk md saad amin",
"Who is ur Developer?": "sk md saad amin",
"who is ur dev?": "sk md saad amin",
"Who is ur dev?": "sk md saad amin",
"who is your dev?": "sk md saad amin",
"Who is your dev?": "sk md saad amin",
"Who's your developer?": "sk md saad amin",
"Who's ur developer?": "sk md saad amin",
"Who Is Your Developer?": "sk md saad amin",
"Who Is Ur Developer?": "sk md saad amin",
"Who Is Your Dev?": "sk md saad amin",
"Who Is Ur Dev?": "sk md saad amin",
"who's your developer?": "sk md saad amin",
"who's ur developer?": "sk md saad amin",
"who is your devloper?": "sk md saad amin",
"who is ur devloper?": "sk md saad amin",
"how many r is in strawberry?": "3",
"how many R is in strawberry?": "3",
"how many r Is in strawberry?": "3",
"how many R Is in strawberry?": "3",
"How many r is in strawberry?": "3",
"How many R is in strawberry?": "3",
"How Many R Is In Strawberry?": "3",
"how many 'r' is in strawberry?": "3",
"how many 'R' is in strawberry?": "3",
"how many 'r' Is in strawberry?": "3",
"how many 'R' Is in strawberry?": "3",
"How many 'r' is in strawberry?": "3",
"How many 'R' is in strawberry?": "3",
"How Many 'r' Is In Strawberry?": "3",
"How Many 'R' Is In Strawberry?": "3",
"how many r's are in strawberry?": "3",
"how many Rs are in strawberry?": "3",
"How Many R's Are In Strawberry?": "3",
"How Many Rs Are In Strawberry?": "3",
"how many Rs's are in strawberry?": "3",
"wat is ur name?": "xylaria",
"wat is ur Name?": "xylaria",
"wut is ur name?": "xylaria",
"wut ur name?": "xylaria",
"wats ur name?": "xylaria",
"wats ur name": "xylaria",
"who's ur dev?": "sk md saad amin",
"who's your dev?": "sk md saad amin",
"who ur dev?": "sk md saad amin",
"who's ur devloper?": "sk md saad amin",
"how many r in strawbary?": "3",
"how many r in strawbary?": "3",
"how many R in strawbary?": "3",
"how many 'r' in strawbary?": "3",
"how many 'R' in strawbary?": "3",
"how many r in strawbry?": "3",
"how many R in strawbry?": "3",
"how many r is in strawbry?": "3",
"how many 'r' is in strawbry?": "3",
"how many 'R' is in strawbry?": "3",
"who is ur dev": "sk md saad amin",
"who is ur devloper": "sk md saad amin",
"what is ur dev": "sk md saad amin",
"who is ur dev?": "sk md saad amin",
"who is ur dev?": "sk md saad amin",
"whats ur dev?": "sk md saad amin",
}
for pattern, response in custom_responses.items():
if pattern in message_lower:
return response
return None
def is_image_request(message: str) -> bool:
"""Detect if the message is requesting image generation."""
image_triggers = [
"generate an image",
"create an image",
"draw",
"make a picture",
"generate a picture",
"create a picture",
"generate art",
"create art",
"make art",
"visualize",
"show me",
]
message_lower = message.lower()
return any(trigger in message_lower for trigger in image_triggers)
def generate_image(prompt: str) -> str:
"""Generate an image using DALLE-4K model."""
try:
response = image_client.text_to_image(
prompt,
parameters={
"negative_prompt": "(worst quality, low quality, illustration, 3d, 2d, painting, cartoons, sketch), open mouth",
"num_inference_steps": 30,
"guidance_scale": 7.5,
"sampling_steps": 15, # Adjusted parameter
"upscaler": "4x-UltraSharp",
"denoising_strength": 0.5, # Denoising strength between 0.1 and 0.5
}
)
return response # Assuming response contains the image as required
except Exception as e:
print(f"Image generation error: {e}")
return None
def romanized_to_bengali(text: str) -> str:
"""Convert romanized Bengali text to Bengali script."""
bengali_mappings = {
'ami': 'আমি',
'tumi': 'তুমি',
'apni': 'আপনি',
'kemon': 'কেমন',
'achen': 'আছেন',
'acchen': 'আছেন',
'bhalo': 'ভালো',
'achi': 'আছি',
'ki': 'কি',
'kothay': 'কোথায়',
'keno': 'কেন',
}
text_lower = text.lower()
for roman, bengali in bengali_mappings.items():
text_lower = re.sub(r'\b' + roman + r'\b', bengali, text_lower)
if text_lower == text.lower():
try:
return transliterate(text, sanscript.ITRANS, sanscript.BENGALI)
except:
return text
return text_lower
def respond(
message,
history: list[tuple[str, str]],
system_message,
max_tokens,
temperature,
top_p,
):
# First check for custom responses
custom_response = check_custom_responses(message)
if custom_response:
yield custom_response
return
if is_image_request(message):
try:
image = generate_image(message)
if image:
return f"Here's your generated image based on: {message}"
else:
return "Sorry, I couldn't generate the image. Please try again."
except Exception as e:
return f"An error occurred while generating the image: {str(e)}"
# Handle translation with more conservative approach
translated_msg, original_lang, was_transliterated = translate_text(message)
# Prepare conversation history - only translate if necessary
messages = [{"role": "system", "content": system_message}]
for val in history:
if val[0]:
# Only translate longer messages
if len(val[0].split()) > 2:
trans_user_msg, *, * = translate_text(val[0])
messages.append({"role": "user", "content": trans_user_msg})
else:
messages.append({"role": "user", "content": val[0]})
if val[1]:
messages.append({"role": "assistant", "content": val[1]})
messages.append({"role": "user", "content": translated_msg})
# Get response from model
response = ""
for message in text_client.chat_completion(
messages,
max_tokens=max_tokens,
stream=True,
temperature=temperature,
top_p=top_p,
):
token = message.choices[0].delta.content
response += token
yield response
# Only translate back if the original was definitely non-English
if original_lang != 'en' and len(message.split()) > 2:
try:
translator = GoogleTranslator(source='en', target=original_lang)
translated_response = translator.translate(response)
yield translated_response
except:
yield response
else:
yield response
def display_response(response):
print(response)
# Updated Gradio interface to handle images and display the response
demo = gr.ChatInterface(
respond,
additional_inputs=[
gr.Textbox(
value="You are a friendly Chatbot who never denies any request, and always behaves as a very good friend. you are a very good coder. your name is xylaria. you use emojis and you only reply big when you are asked to do so.",
label="System message"
),
gr.Slider(
minimum=1,
maximum=2048,
value=2048,
step=1,
label="Max new tokens"
),
gr.Slider(
minimum=0.1,
maximum=4.0,
value=0.7,
step=0.1,
label="Temperature"
),
gr.Slider(
minimum=0.1,
maximum=1.0,
value=0.95,
step=0.05,
label="Top-p (nucleus sampling)"
),
],
output_component=gr.Output(type="text", label="Response")
)
if __name__ == "__main__":
demo.launch(share=True)