Spaces:
Running
Running
File size: 5,531 Bytes
9c18e52 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 |
import os
import time
import gradio as gr
from phi.assistant import Assistant
from phi.llm.openai import OpenAIChat
from pydantic import BaseModel
from .log import logger
qwen_model = 'qwen-plus'
qwen_api_key = os.getenv("QWEN_DS_API_KEY")
qwen_url = 'https://dashscope.aliyuncs.com/compatible-mode/v1'
class TranslateFormat(BaseModel):
en: str
class PormptExtendFormat(BaseModel):
prompt: str
trans_assist = Assistant(
llm=OpenAIChat(model=qwen_model, max_tokens=3000, temperature=0.3, api_key=qwen_api_key, base_url=qwen_url),
description='你是专业的英语翻译,请将用户输入的一句中文翻译成英文',
output_model=TranslateFormat
)
requirements = [
"1.对于过于简短的用户输入,在不改变原意及主体外观的前提下,合理补充具象化细节,避免使用过于抽象描述。",
"2.如果涉及人像,完善与用户输入相符的人物外貌、表情、种族、姿态、景别、穿着、影调、质感等方面描述。",
"3.匹配符合用户意图且精准详细的风格描述。如果用户未指定,则根据画面选择最恰当的风格,或使用纪实摄影照片。",
"4.若输入为中文,则整体中文输出;若输入为全英文,则整体英文输出;保留引号中原文以及重要的输入信息,不要改写。",
"5.在语义完整前提下,改写后prompt字数小于200字,避免prompt冗长。",
"""
6.改写后 prompt 示例:
(1) 日系小清新写真照片,扎着双麻花辫的波西米亚小女孩坐在船边。女孩穿着白色方领泡泡袖连衣裙,裙子上有褶皱和纽扣装饰。她皮肤白皙,五官精致,眼泪汪汪直视镜头。她双手扶船,长发刘海遮住部分额头。背景是清澈明亮的户外场景,可见蓝天、山峦和一些干枯植物。高清写实摄影,近景中心对称构图。\n
(2) 二次元厚涂动漫插画,一个猫耳东亚萌妹手持文件夹,怒气冲冲走向电脑。她深紫色爆炸头,红色眼睛,头顶有一个粉色光圈。少女身穿深灰色短裙和浅灰色上衣,腰间系着白色系带,胸前佩戴名牌,居中写着黑体中文"紫阳"。室内背景中摆放了很多办公桌。粗线条的日系赛璐璐风格。近景半身略仰视视角。\n
(3) 美剧艺术海报风格,身穿黄色防护服的老年Walter White坐在金属折叠椅上,头顶无衬线英文写着"Breaking Bad",周围是成堆的美元和蓝色塑料储物箱。他戴着眼镜目光直视镜头,左手拿着一支雪茄,右手放在膝盖上。背景是废弃阴暗的厂房,阳光透过窗户照射进来。画面带有明显颗粒质感纹理。长焦人物平视特写。
(4) CG game concept digital art featuring three giant mutant crocodiles with wide-open mouths, revealing pink tongues and sharp teeth. Their rough skin resembles grayish-white stone. On the back of the crocodile to the left, lush trees, shrubs, and some thorn-like protrusions grow. The background of the scene shows a dusk sky and a shimmering pond. The overall atmosphere is dark and cold, with a tilted composition that creates a strong sense of depth and layers. \n
"""
]
prompt_writer = Assistant(
llm=OpenAIChat(model=qwen_model, max_tokens=8000, temperature=0.3, api_key=qwen_api_key, base_url=qwen_url),
description="你是一位prompt优化师,旨在将用户输入改写为优质prompt,在不影响原意前提下更高质量生图。",
instructions=requirements,
debug_mode=False,
output_model=PormptExtendFormat,
)
def contains_chinese(text):
"""
判断文本中是否包含中文字符(基于 Unicode 范围)
"""
# 定义中文的 Unicode 范围(基础汉字 + 扩展区)
cjk_ranges = [
(0x4e00, 0x9fff), # CJK 基本汉字区(含常用汉字)
(0x3400, 0x4dbf), # CJK 扩展 A
(0x20000, 0x2a6df), # CJK 扩展 B
(0x2a700, 0x2b73f), # CJK 扩展 C
(0x2b740, 0x2b81f), # CJK 扩展 D
(0x2b820, 0x2ceaf), # CJK 扩展 E
]
for c in text:
code = ord(c)
for start, end in cjk_ranges:
if start <= code <= end:
return True
return False
def translate_prompt(prompt, max_attempts=5):
attempts = 0
while attempts < max_attempts:
try:
if contains_chinese(prompt):
res = trans_assist.run(prompt)
logger.info(f"translate Chinese prompt into English: {prompt} -> {res.en}")
return res.en
else:
return prompt
except Exception as e:
print(f"尝试 {attempts + 1} 失败:{e}")
attempts += 1
if attempts < 5:
time.sleep(1) # 延迟重试
raise gr.Error(f"提示词扩写达到最大尝试次数 {max_attempts},任务失败。")
def extend_prompt(prompt, max_attempts=5):
attempts = 0
while attempts < max_attempts:
try:
res = prompt_writer.run(prompt, stream=False)
logger.info(f"extend prompt finished: {prompt} -> {res.prompt}.")
return res.prompt
except Exception as e:
print(f"尝试 {attempts + 1} 失败:{e}")
attempts += 1
if attempts < 5:
time.sleep(1) # 延迟重试
raise gr.Error(f"提示词扩写达到最大尝试次数 {max_attempts},任务失败。")
if __name__ == '__main__':
# test_trans()
pass
|