Spaces:

mateoluksenberg
/

chat

Running

App Files Community

mateoluksenberg committed on Aug 7, 2024

Commit

7104c5d

verified ·

1 Parent(s): 2a0024c

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -30

app.py CHANGED Viewed

@@ -117,44 +117,26 @@ def extract_pptx(path):
 #         raise gr.Error("Oops, unsupported files.")
 def mode_load(file_obj):
-    # Intenta detectar el tipo de archivo basado en su contenido
     try:
         file_obj.seek(0)  # Asegúrate de que el puntero esté al inicio del archivo
-        # Verifica si es PDF
-        if file_obj.read(4) == b'%PDF':
-            file_obj.seek(0)  # Vuelve al inicio del archivo para procesar
             content = extract_pdf(file_obj)
             choice = "doc"
         elif file_obj.name.endswith(".docx"):
-            file_obj.seek(0)
             content = extract_docx(file_obj)
             choice = "doc"
         elif file_obj.name.endswith(".pptx"):
-            file_obj.seek(0)
             content = extract_pptx(file_obj)
             choice = "doc"
-        elif file_obj.name.endswith(".txt"):
-            file_obj.seek(0)
-            content = file_obj.read().decode('utf-8', errors='ignore')
-            choice = "doc"
-        elif file_obj.name.endswith(".py"):
-            file_obj.seek(0)
-            content = file_obj.read().decode('utf-8', errors='ignore')
-            choice = "doc"
-        elif file_obj.name.endswith(".json"):
-            file_obj.seek(0)
-            content = file_obj.read().decode('utf-8', errors='ignore')
-            choice = "doc"
-        elif file_obj.name.endswith(".cpp"):
-            file_obj.seek(0)
-            content = file_obj.read().decode('utf-8', errors='ignore')
-            choice = "doc"
-        elif file_obj.name.endswith(".md"):
-            file_obj.seek(0)
             content = file_obj.read().decode('utf-8', errors='ignore')
             choice = "doc"
         elif file_obj.name.endswith((".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".webp")):
-            file_obj.seek(0)
             content = Image.open(file_obj).convert('RGB')
             choice = "image"
         else:
@@ -329,11 +311,8 @@ def simple_chat(message: dict, temperature: float = 0.8, max_length: int = 4096,
         conversation = []
         if "file" in message and message["file"]:
-            # Lee el contenido del archivo como bytes
-            file_contents = io.BytesIO(message["file"]).read()
-            # Convierte los bytes a una cadena si `mode_load` espera texto
-            file_contents_str = file_contents.decode('utf-8', errors='ignore')
-            choice, contents = mode_load(file_contents_str)
             if choice == "image":
                 conversation.append({"role": "user", "image": contents, "content": message["text"]})
             elif choice == "doc":

 #         raise gr.Error("Oops, unsupported files.")
 def mode_load(file_obj):
     try:
         file_obj.seek(0)  # Asegúrate de que el puntero esté al inicio del archivo
+        # Detecta el tipo de archivo basándote en los primeros bytes si es posible
+        file_header = file_obj.read(4)
+        file_obj.seek(0)  # Vuelve al inicio del archivo para procesamiento completo
+        if file_header.startswith(b'%PDF'):
             content = extract_pdf(file_obj)
             choice = "doc"
         elif file_obj.name.endswith(".docx"):
             content = extract_docx(file_obj)
             choice = "doc"
         elif file_obj.name.endswith(".pptx"):
             content = extract_pptx(file_obj)
             choice = "doc"
+        elif file_obj.name.endswith(".txt") or file_obj.name.endswith(".py") or file_obj.name.endswith(".json") or file_obj.name.endswith(".cpp") or file_obj.name.endswith(".md"):
             content = file_obj.read().decode('utf-8', errors='ignore')
             choice = "doc"
         elif file_obj.name.endswith((".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".webp")):
             content = Image.open(file_obj).convert('RGB')
             choice = "image"
         else:
         conversation = []
         if "file" in message and message["file"]:
+            file_contents = io.BytesIO(message["file"])  # Asegúrate de que sea un objeto BytesIO
+            choice, contents = mode_load(file_contents)
             if choice == "image":
                 conversation.append({"role": "user", "image": contents, "content": message["text"]})
             elif choice == "doc":