Spaces:

Segizu
/

Face_Recognition

Build error

App Files Community

Segizu committed on May 8

Commit

6773de5

1 Parent(s): d3af2e5

metadata v12

Browse files

Files changed (1) hide show

app.py +27 -33

app.py CHANGED Viewed

@@ -8,25 +8,24 @@ import pickle
 from pathlib import Path
 import gc
-# 🔐 Token automático (si es necesario)
-HF_TOKEN = os.getenv("HF_TOKEN")
-# 📁 Directorio para embeddings
 EMBEDDINGS_DIR = Path("embeddings")
 EMBEDDINGS_DIR.mkdir(exist_ok=True)
 EMBEDDINGS_FILE = EMBEDDINGS_DIR / "embeddings.pkl"
-# ✅ Cargar dataset directamente desde Hugging Face Hub
 dataset = load_dataset(
     "csv",
     data_files="metadata.csv",
-    split="train",
-)
 print("✅ Primer item:", dataset[0])
 dataset = dataset.cast_column("image", HfImage())
-# 🔄 Preprocesar imagen para Facenet
 def preprocess_image(img: Image.Image) -> np.ndarray:
     img_rgb = img.convert("RGB")
     img_resized = img_rgb.resize((160, 160), Image.Resampling.LANCZOS)
@@ -35,11 +34,11 @@ def preprocess_image(img: Image.Image) -> np.ndarray:
 # 📦 Construir base de datos de embeddings
 def build_database():
     if EMBEDDINGS_FILE.exists():
-        print("📂 Cargando embeddings desde el archivo...")
-        with open(EMBEDDINGS_FILE, 'rb') as f:
             return pickle.load(f)
-    print("🔄 Calculando embeddings (esto puede tomar unos minutos)...")
     database = []
     batch_size = 10
@@ -47,15 +46,10 @@ def build_database():
         batch = dataset[i:i + batch_size]
         print(f"📦 Procesando lote {i // batch_size + 1}/{(len(dataset) + batch_size - 1) // batch_size}")
-        for j, item in enumerate(batch):
             try:
-                if not isinstance(item, dict) or "image" not in item:
-                    print(f"⚠️ Saltando item {i+j} - estructura inválida: {item}")
-                    continue
-                img = item["image"]
                 if not isinstance(img, Image.Image):
-                    print(f"⚠️ Saltando item {i+j} - no es imagen: {type(img)}")
                     continue
                 img_processed = preprocess_image(img)
@@ -65,20 +59,20 @@ def build_database():
                     enforce_detection=False
                 )[0]["embedding"]
-                database.append((f"image_{i+j}", img, embedding))
-                print(f"✅ Procesada imagen {i+j+1}/{len(dataset)}")
                 del img_processed
                 gc.collect()
             except Exception as e:
-                print(f"❌ Error al procesar imagen {i+j}: {str(e)}")
                 continue
-        # Guardar después de cada lote
         if database:
-            print("💾 Guardando progreso...")
-            with open(EMBEDDINGS_FILE, 'wb') as f:
                 pickle.dump(database, f)
         gc.collect()
@@ -97,8 +91,8 @@ def find_similar_faces(uploaded_image: Image.Image):
         del img_processed
         gc.collect()
     except Exception as e:
-        print(f"Error al procesar imagen de consulta: {str(e)}")
-        return [], "⚠ No se detectó un rostro válido en la imagen."
     similarities = []
     for name, db_img, embedding in database:
@@ -110,18 +104,18 @@ def find_similar_faces(uploaded_image: Image.Image):
     top_matches = similarities[:5]
     gallery_items = []
-    text_summary = ""
     for sim, name, img in top_matches:
         caption = f"{name} - Similitud: {sim:.2f}"
         gallery_items.append((img, caption))
-        text_summary += caption + "\n"
-    return gallery_items, text_summary
-# ⚙️ Iniciar la aplicación
 print("🚀 Iniciando aplicación...")
 database = build_database()
-print(f"✅ Base de datos cargada con {len(database)} imágenes")
 # 🎛️ Interfaz Gradio
 demo = gr.Interface(
@@ -129,10 +123,10 @@ demo = gr.Interface(
     inputs=gr.Image(label="📤 Sube una imagen", type="pil"),
     outputs=[
         gr.Gallery(label="📸 Rostros más similares"),
-        gr.Textbox(label="🧠 Similitud", lines=6)
     ],
     title="🔍 Buscador de Rostros con DeepFace",
-    description="Sube una imagen y se comparará contra los rostros del dataset alojado en Hugging Face (`Segizu/facial-recognition`)."
 )
 demo.launch()

 from pathlib import Path
 import gc
+# 📁 Directorio para almacenar embeddings
 EMBEDDINGS_DIR = Path("embeddings")
 EMBEDDINGS_DIR.mkdir(exist_ok=True)
 EMBEDDINGS_FILE = EMBEDDINGS_DIR / "embeddings.pkl"
+# ✅ Cargar dataset desde metadata.csv (con URLs absolutas)
 dataset = load_dataset(
     "csv",
     data_files="metadata.csv",
+    split="train"
+)
 print("✅ Primer item:", dataset[0])
+# 🖼️ Convertir columna a imágenes usando HfImage (PIL)
 dataset = dataset.cast_column("image", HfImage())
+# 🔄 Preprocesar imagen para DeepFace
 def preprocess_image(img: Image.Image) -> np.ndarray:
     img_rgb = img.convert("RGB")
     img_resized = img_rgb.resize((160, 160), Image.Resampling.LANCZOS)
 # 📦 Construir base de datos de embeddings
 def build_database():
     if EMBEDDINGS_FILE.exists():
+        print("📂 Cargando embeddings desde archivo...")
+        with open(EMBEDDINGS_FILE, "rb") as f:
             return pickle.load(f)
+    print("🔄 Calculando embeddings...")
     database = []
     batch_size = 10
         batch = dataset[i:i + batch_size]
         print(f"📦 Procesando lote {i // batch_size + 1}/{(len(dataset) + batch_size - 1) // batch_size}")
+        for j, img in enumerate(batch):
             try:
                 if not isinstance(img, Image.Image):
+                    print(f"⚠️ Saltando item {i + j} - no es imagen: {type(img)}")
                     continue
                 img_processed = preprocess_image(img)
                     enforce_detection=False
                 )[0]["embedding"]
+                database.append((f"image_{i + j}", img, embedding))
+                print(f"✅ Procesada imagen {i + j + 1}/{len(dataset)}")
                 del img_processed
                 gc.collect()
             except Exception as e:
+                print(f"❌ Error al procesar imagen {i + j}: {str(e)}")
                 continue
+        # Guardar después de cada batch
         if database:
+            print("💾 Guardando embeddings...")
+            with open(EMBEDDINGS_FILE, "wb") as f:
                 pickle.dump(database, f)
         gc.collect()
         del img_processed
         gc.collect()
     except Exception as e:
+        print(f"Error al procesar imagen de entrada: {str(e)}")
+        return [], "⚠ No se detectó un rostro válido."
     similarities = []
     for name, db_img, embedding in database:
     top_matches = similarities[:5]
     gallery_items = []
+    summary = ""
     for sim, name, img in top_matches:
         caption = f"{name} - Similitud: {sim:.2f}"
         gallery_items.append((img, caption))
+        summary += caption + "\n"
+    return gallery_items, summary
+# 🚀 Inicializar app
 print("🚀 Iniciando aplicación...")
 database = build_database()
+print(f"✅ Base cargada con {len(database)} imágenes.")
 # 🎛️ Interfaz Gradio
 demo = gr.Interface(
     inputs=gr.Image(label="📤 Sube una imagen", type="pil"),
     outputs=[
         gr.Gallery(label="📸 Rostros más similares"),
+        gr.Textbox(label="🧠 Resumen de similitud", lines=6)
     ],
     title="🔍 Buscador de Rostros con DeepFace",
+    description="Sube una imagen y se comparará contra los rostros del dataset `Segizu/facial-recognition`."
 )
 demo.launch()