Spaces:

Xolkin
/

DoctorAI

Running

App Files Files Community

Xolkin committed on May 11

Commit

f29c29c

verified ·

1 Parent(s): fd212a6

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -20

app.py CHANGED Viewed

@@ -6,27 +6,17 @@ model_name = "gpt2"  # Модель GPT-2
 model = AutoModelForCausalLM.from_pretrained(model_name)
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-def respond(
-    message,
-    history=None,
-    system_message=None,
-    max_tokens=512,
-    temperature=0.7,
-    top_p=0.95,
-):
-    # Инициализация history как пустого списка, если его нет
     if history is None:
-        history = []
-    elif not isinstance(history, list):
-        history = []
-    # Объединяем сообщения в историю, добавляя последнее сообщение пользователя
     input_text = "\n".join([msg[1] for msg in history] + [message])
-    # Токенизация текста для модели
     inputs = tokenizer(input_text, return_tensors="pt", truncation=True, padding=True)
-    # Генерация ответа с использованием модели
     outputs = model.generate(
         inputs["input_ids"],
         max_length=max_tokens,
@@ -35,13 +25,15 @@ def respond(
         do_sample=True,
     )
-    # Декодируем ответ модели
     response = tokenizer.decode(outputs[0], skip_special_tokens=True)
-    # Форматируем ответ в соответствии с шаблоном
     response = format_response(response)
-    return response
 def format_response(response):
     # Форматируем ответ в соответствии с шаблоном
@@ -60,7 +52,6 @@ def extract_diagnosis(response):
 def extract_operation(response):
     # Извлекаем название операции из ответа
-    # Здесь можно настроить под реальный сценарий
     operation = "Не требуется"  # Пример, что операция не требуется
     return operation.strip()
@@ -78,7 +69,8 @@ demo = gr.Interface(
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, label="Temperature"),
         gr.Slider(minimum=0.1, maximum=1.0, value=0.95, label="Top-p"),
     ],
-    outputs="text",
 )
 if __name__ == "__main__":

 model = AutoModelForCausalLM.from_pretrained(model_name)
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+def respond(message, history=None, system_message=None, max_tokens=512, temperature=0.7, top_p=0.95):
     if history is None:
+        history = []  # Инициализируем пустой список, если history не передан
+    # Объединяем сообщения в историю
     input_text = "\n".join([msg[1] for msg in history] + [message])
+    # Токенизация текста
     inputs = tokenizer(input_text, return_tensors="pt", truncation=True, padding=True)
+    # Генерация ответа
     outputs = model.generate(
         inputs["input_ids"],
         max_length=max_tokens,
         do_sample=True,
     )
     response = tokenizer.decode(outputs[0], skip_special_tokens=True)
+    # Формируем ответ согласно шаблону
     response = format_response(response)
+    # Обновляем историю
+    history.append((message, response))
+    return response, history
 def format_response(response):
     # Форматируем ответ в соответствии с шаблоном
 def extract_operation(response):
     """Return the operation name to report for a model response.

     Placeholder implementation: ``response`` is not inspected, and the
     same fixed string ("Не требуется", i.e. "Not required") is returned
     for every input.
     """
     # Example value meaning that no operation is required.
     return "Не требуется".strip()
         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, label="Temperature"),
         gr.Slider(minimum=0.1, maximum=1.0, value=0.95, label="Top-p"),
     ],
+    outputs=["text", "state"],  # Возвращаем ответ и обновленную историю
+    live=True  # Обновляем интерфейс в реальном времени
 )
 if __name__ == "__main__":