Spaces:

wyyadd
/

facetype

Runtime error

App Files Files Community

wyyadd committed on Apr 11

Commit

2360da5

1 Parent(s): b19ada5

add model

Browse files

Files changed (5) hide show

.gitignore +2 -1
app.py +21 -0
main.py +23 -67
model.py +210 -0
requirements.txt +6 -1

.gitignore CHANGED Viewed

@@ -169,4 +169,5 @@ cython_debug/
 # PyPI configuration file
 .pypirc
-.idea/*

 # PyPI configuration file
 .pypirc
+.idea/*
+data

app.py ADDED Viewed

	@@ -0,0 +1,21 @@

+import gradio as gr
+from main import get_pred_binary
+from model import TARGET_LABELS
def get_face_type(img):
    """Classify the face in an uploaded image and render the result as text.

    Args:
        img: Image handed over by the Gradio "image" input; ``None`` when the
            user submits without an image. Assumed to be an RGB ``ndarray``
            (Gradio's default for image inputs) -- TODO confirm if the input
            component is ever reconfigured.

    Returns:
        A multi-line string: the integer ``face_type`` obtained by reading the
        per-label 0/1 predictions as a binary number (first label is the most
        significant bit), followed by one ``label: bool`` line per entry of
        ``TARGET_LABELS``.
    """
    import numpy as np  # local import: this module does not import numpy at top level

    if img is None:
        return "No image provided."

    # DeepFace documents ndarray inputs as BGR, while Gradio delivers RGB, so
    # swap the channel order for plain 3-channel images before embedding.
    if getattr(img, "ndim", 0) == 3 and img.shape[2] == 3:
        img = np.ascontiguousarray(img[..., ::-1])

    pred_binary = get_pred_binary(img)
    label_lines = [f"{label}: {bool(pred)}" for label, pred in zip(TARGET_LABELS, pred_binary)]
    face_type = int(''.join(map(str, pred_binary)), 2)
    # Join outside the f-string: reusing double quotes inside a replacement
    # field is a SyntaxError on Python versions before 3.12.
    details = "\n".join(label_lines)
    return f"face_type: {face_type}\n{details}"
# Gradio UI: a single image input routed through get_face_type, with the
# formatted prediction shown as plain text.
demo = gr.Interface(fn=get_face_type, inputs=["image"], outputs=["text"])
demo.launch()

main.py CHANGED Viewed

@@ -1,15 +1,19 @@
 import cv2
 import numpy as np
 import requests
 from deepface import DeepFace
 from fastapi import FastAPI, HTTPException
 app = FastAPI()
-np.random.seed(42)  # For reproducibility
-hyperplanes = np.random.randn(512, 5)
-# Optional: Normalize each hyperplane
-hyperplanes /= np.linalg.norm(hyperplanes, axis=0)
 @app.get("/face-type")
@@ -23,73 +27,25 @@ def get_face_type(url: str):
     except requests.exceptions.RequestException as e:
         raise HTTPException(status_code=400, detail=f"Failed to download image from URL: {str(e)}")
     try:
         embedding_objs = DeepFace.represent(
             img_path=img,
-            model_name="Facenet512")
     except Exception as e:
         raise HTTPException(status_code=500, detail="No face detected.")
-    ebd = np.array(embedding_objs[0]['embedding'], dtype=np.float32)
-    # Project vector onto hyperplanes
-    projections = np.dot(ebd, hyperplanes)
-    # Binarize (sign function)
-    bits = (projections >= 0).astype(int)
-    # Convert bits to integer (LSB first)
-    face_type = int(''.join(map(str, bits)), 2)
-    return {"face_type": face_type}
-# def get_face_type(file):
-#     try:
-#         attribute = DeepFace.analyze(
-#             img_path=file,
-#             actions=['age', 'gender'],
-#         )
-#         gender = attribute[0]['dominant_gender']
-#         age = attribute[0]['age']
-#         if gender == 'Man':
-#             if age < 10:
-#                 face_type = 7
-#             elif age < 20:
-#                 face_type = 3
-#             elif age < 30:
-#                 face_type = 12
-#             elif age < 40:
-#                 face_type = 1
-#             elif age < 50:
-#                 face_type = 15
-#             elif age < 60:
-#                 face_type = 5
-#             elif age < 70:
-#                 face_type = 10
-#             else:
-#                 face_type = 8
-#         elif gender == 'Woman':
-#             if age < 10:
-#                 face_type = 14
-#             elif age < 20:
-#                 face_type = 0
-#             elif age < 30:
-#                 face_type = 4
-#             elif age < 40:
-#                 face_type = 6
-#             elif age < 50:
-#                 face_type = 13
-#             elif age < 60:
-#                 face_type = 2
-#             elif age < 70:
-#                 face_type = 9
-#             else:
-#                 face_type = 11
-#         else:
-#             return "Face could not be detected."
-#         return f"face type:{face_type}---gender:{gender}---age:{age}"
-#     except Exception as e:
-#         print(e)
-#         return f"Face could not be detected."
-#
-#
-# if __name__ == '__main__':
-#     demo = gr.Interface(fn=get_new_face_type, inputs="image", outputs="label")
-#     demo.launch(share=False)

 import cv2
 import numpy as np
 import requests
+import torch
 from deepface import DeepFace
 from fastapi import FastAPI, HTTPException
+from model import MultiLabelClassifier
 app = FastAPI()
# Trained classifier weights; the training script in model.py writes this file.
model_path = "data/classifier.pth"
model = MultiLabelClassifier(embedding_dim=4096, hidden_dim=1024)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
# map_location remaps tensors that were saved from a different device (the
# training script runs on "mps") so the checkpoint loads on this host.
model.load_state_dict(torch.load(model_path, map_location=device, weights_only=True))
# Inference only: eval() disables the dropout layers.
model.to(device).eval()
 @app.get("/face-type")
     except requests.exceptions.RequestException as e:
         raise HTTPException(status_code=400, detail=f"Failed to download image from URL: {str(e)}")
+    pred_binary = get_pred_binary(img)
+    face_type = int(''.join(map(str, pred_binary)), 2)
+    return {"face_type": face_type}
def get_pred_binary(img: np.ndarray, threshold: float = 0.5):
    """Predict the binary facial attributes for the first face found in ``img``.

    Args:
        img: Image array passed straight to ``DeepFace.represent``.
        threshold: Probability above which an attribute counts as present.
            Defaults to 0.5, the value previously hard-coded.

    Returns:
        A NumPy integer array with one 0/1 entry per classifier output.

    Raises:
        HTTPException: status 500 when DeepFace fails or returns no face.
    """
    try:
        embedding_objs = DeepFace.represent(
            img_path=img,
            model_name="VGG-Face")
    except Exception as e:
        # Chain the cause so the underlying DeepFace error stays in the traceback.
        raise HTTPException(status_code=500, detail="No face detected.") from e
    if not embedding_objs:
        # Guard the [0] lookup below against an empty result.
        raise HTTPException(status_code=500, detail="No face detected.")

    # Only the first returned face is classified.
    ebd = torch.tensor(embedding_objs[0]['embedding'], dtype=torch.float32).to(device)
    with torch.no_grad():
        logits = model(ebd)
        probs = torch.sigmoid(logits).cpu().numpy()
    return (probs > threshold).astype(int)

model.py ADDED Viewed

	@@ -0,0 +1,210 @@

+import logging
+import pickle
+from concurrent.futures import ProcessPoolExecutor, as_completed
+from pathlib import Path
+import pandas
+import pandas as pd
+import torch
+from deepface import DeepFace
+from sklearn.metrics import accuracy_score, recall_score, f1_score
+from torch import nn
+from torch.utils.data import Dataset, DataLoader
+from tqdm import tqdm
+import torch.nn.functional as F
+TARGET_LABELS = ["Male", "Young", "Oval_Face", "High_Cheekbones", "Big_Lips", "Big_Nose"]
def load_df(target_labels: list[str], data_dir="./data"):
    """Load the partition and attribute CSVs and split them into train/test frames.

    Args:
        target_labels: Attribute columns to convert from -1/1 to 0/1.
        data_dir: Directory containing ``list_eval_partition.csv`` and
            ``list_attr_celeba.csv``. Defaults to ``./data``.

    Returns:
        ``(train_df, test_df)``: rows whose ``partition`` is not 2, and rows
        whose ``partition`` is 2. Both are independent copies.

    Raises:
        KeyError: if a requested label is not a column of the merged table.
    """
    data_root = Path(data_dir)

    # 1. Load both CSV files.
    partition_df = pd.read_csv(data_root / 'list_eval_partition.csv')
    labels_df = pd.read_csv(data_root / 'list_attr_celeba.csv')

    # 2. Join partition info and attributes on the image id.
    df = pd.merge(partition_df, labels_df, on='image_id')

    # 3. Map labels from {-1, 1} to {0, 1}.
    for label in target_labels:
        df[label] = (df[label] + 1) // 2

    # 4. Split; copy so callers can modify the frames without pandas
    #    chained-assignment warnings or aliasing the merged table.
    is_test = df['partition'] == 2
    train_df = df[~is_test].copy()
    test_df = df[is_test].copy()
    return train_df, test_df
class EmbeddingDataset(Dataset):
    """Dataset pairing cached VGG-Face embeddings with binary attribute labels.

    On construction, every image listed in ``df['image_id']`` that has no
    ``<image_id>.pkl`` cache file next to it is embedded with DeepFace in a
    process pool and the embedding is pickled to that cache file. Rows whose
    embedding could not be produced are dropped so that indexing never hits a
    missing cache file.

    Args:
        df: Table with an ``image_id`` column and one column per target label.
        target_labels: Names of the label columns returned by ``__getitem__``.
        image_root: Directory holding the images and their cache files.
            Defaults to ``DEFAULT_IMAGE_ROOT``.
    """

    DEFAULT_IMAGE_ROOT = Path("./data/img_align_celeba/img_align_celeba/")

    def __init__(self, df: pandas.DataFrame, target_labels: list[str], image_root=None):
        self.df = df
        self.image_root = Path(image_root) if image_root is not None else self.DEFAULT_IMAGE_ROOT
        self.target_labels = target_labels
        self.preprocess()

    def preprocess(self):
        """Compute and cache embeddings for all images that lack a cache file."""
        to_process_images = [image_id for image_id in self.df['image_id'] if
                             not (self.image_root / f"{image_id}.pkl").exists()]
        if not to_process_images:
            return
        logging.info(f"Preprocessing {len(to_process_images)} images")

        failed = set()
        with ProcessPoolExecutor() as executor:
            # Submit the static helper rather than a bound method, so each task
            # pickles only a path and an id instead of the whole dataset.
            futures = {
                executor.submit(self._embed_and_cache, self.image_root, image_id): image_id
                for image_id in to_process_images
            }
            for future in tqdm(as_completed(futures), total=len(futures), desc="Preprocessing"):
                try:
                    future.result()
                except Exception as e:
                    failed.add(futures[future])
                    logging.error(f"Error processing image: {e}")

        if failed:
            # Without a cache file __getitem__ would raise FileNotFoundError
            # mid-epoch, so remove the affected rows up front.
            logging.warning(f"Dropping {len(failed)} images without embeddings: {sorted(failed)}")
            self.df = self.df[~self.df['image_id'].isin(failed)]

    @staticmethod
    def _embed_and_cache(image_root: Path, image_id: str):
        """Embed one image with DeepFace and pickle the tensor to its cache file."""
        image_path = image_root / image_id
        cache_file = image_root / f"{image_id}.pkl"
        if cache_file.exists():
            return
        embedding_obj = DeepFace.represent(
            img_path=str(image_path),
            model_name="VGG-Face",
            enforce_detection=False
        )
        embedding = torch.tensor(embedding_obj[0]["embedding"], dtype=torch.float32)
        # Write to a temporary file and rename, so an interrupted run cannot
        # leave a truncated cache file that later looks complete.
        tmp_file = cache_file.with_name(cache_file.name + ".tmp")
        with open(tmp_file, "wb") as f:
            pickle.dump(embedding, f)
        tmp_file.replace(cache_file)

    def _process_image(self, image_id: str):
        """Embed and cache a single image under this dataset's image root."""
        self._embed_and_cache(self.image_root, image_id)

    def __len__(self):
        return len(self.df)

    def __getitem__(self, idx):
        """Return ``(embedding, labels)`` for the row at position ``idx``."""
        row = self.df.iloc[idx]
        cache_file = self.image_root / f"{row['image_id']}.pkl"
        # NOTE(security): pickle.load can execute arbitrary code; only point
        # image_root at cache files produced by this class.
        with open(cache_file, "rb") as f:
            embedding = pickle.load(f)
        labels = torch.from_numpy(row[self.target_labels].values.astype(int))
        return embedding, labels
class MultiLabelClassifier(nn.Module):
    """Three-layer MLP that maps an embedding to one logit per target label.

    Layer widths are ``embedding_dim -> hidden_dim -> hidden_dim // 2 ->
    len(TARGET_LABELS)``, with ReLU and dropout (p=0.1) after each of the
    first two linear layers. The output is raw logits; no sigmoid is applied.
    """

    def __init__(self, embedding_dim: int, hidden_dim: int):
        super().__init__()
        self.embedding_dim = embedding_dim
        self.hidden_dim = hidden_dim
        self.output_dim = len(TARGET_LABELS)
        self.dropout = 0.1

        half_hidden = hidden_dim // 2
        # Keep this layer order and the `classifier` attribute name: saved
        # state_dict keys (classifier.0, classifier.3, classifier.6) depend on them.
        layers = [
            nn.Linear(embedding_dim, hidden_dim),
            nn.ReLU(inplace=True),
            nn.Dropout(self.dropout),
            nn.Linear(hidden_dim, half_hidden),
            nn.ReLU(inplace=True),
            nn.Dropout(self.dropout),
            nn.Linear(half_hidden, self.output_dim),
        ]
        self.classifier = nn.Sequential(*layers)

    def forward(self, x):
        """Return the per-label logits for ``x``."""
        logits = self.classifier(x)
        return logits
class FocalLoss(nn.Module):
    """Binary focal loss computed on raw logits, for multi-label targets.

    Each element's loss is ``alpha * (1 - p_t) ** gamma * BCE``, where ``p_t``
    is the predicted probability of the true class.

    Args:
        alpha: Constant scale applied to every element's loss.
        gamma: Focusing exponent; larger values down-weight easy examples.
        reduction: ``'mean'`` or ``'sum'``; any other value returns the
            unreduced element-wise loss.
    """

    def __init__(self, alpha=1.0, gamma=2.0, reduction='mean'):
        super().__init__()
        self.alpha = alpha
        self.gamma = gamma
        self.reduction = reduction

    def forward(self, inputs: torch.Tensor, targets: torch.Tensor):
        """Return the focal loss of logits ``inputs`` against 0/1 ``targets``."""
        # Take the cross-entropy from the logits directly: sigmoid followed by
        # binary_cross_entropy saturates for large |logit|, which clamps the
        # loss and zeroes the gradient on confidently wrong predictions.
        ce_loss = F.binary_cross_entropy_with_logits(inputs, targets.float(), reduction='none')
        probs = torch.sigmoid(inputs)
        pt = torch.where(targets == 1, probs, 1 - probs)
        focal_loss = self.alpha * (1 - pt) ** self.gamma * ce_loss

        if self.reduction == 'mean':
            return focal_loss.mean()
        if self.reduction == 'sum':
            return focal_loss.sum()
        return focal_loss
def _select_device() -> torch.device:
    """Return CUDA if available, else Apple MPS if available, else CPU."""
    if torch.cuda.is_available():
        return torch.device("cuda")
    mps_backend = getattr(torch.backends, "mps", None)
    if mps_backend is not None and mps_backend.is_available():
        return torch.device("mps")
    return torch.device("cpu")


def _evaluate(model, test_loader, criterion, device, epoch):
    """Run one pass over the test set and log loss, accuracy, recall and F1."""
    model.eval()
    test_loss = 0.0
    all_preds = []
    all_targets = []
    with torch.no_grad():
        for inputs, targets in tqdm(test_loader, desc=f"Test Epoch {epoch}"):
            inputs, targets = inputs.to(device), targets.to(device)
            outputs = model(inputs)
            test_loss += criterion(outputs, targets.float()).item()
            # Store int predictions on the CPU so scikit-learn receives the
            # same dtype family for predictions and targets.
            all_preds.append((torch.sigmoid(outputs) > 0.5).int().cpu())
            all_targets.append(targets.cpu())

    avg_test_loss = test_loss / max(len(test_loader), 1)
    all_preds = torch.cat(all_preds).numpy()
    all_targets = torch.cat(all_targets).numpy()
    accuracy = accuracy_score(all_targets, all_preds)
    recall = recall_score(all_targets, all_preds, average='macro')
    f1 = f1_score(all_targets, all_preds, average='macro')
    logging.info(
        f"Epoch {epoch} - Test Loss: {avg_test_loss:.4f}, Accuracy: {accuracy:.2f}, Recall: {recall:.2f}, F1: {f1:.2f}")


def main():
    """Train the multi-label attribute classifier and save its weights.

    Loads the train/test tables, builds cached-embedding datasets, trains for
    50 epochs with focal loss and Adam, evaluates every fifth epoch and after
    the last one, and writes the state dict to ``data/classifier.pth``.
    """
    logging.basicConfig(
        level=logging.INFO,
        format='%(asctime)s - %(levelname)s - %(message)s',
        handlers=[
            logging.FileHandler("train.log"),
            logging.StreamHandler()  # Also log to the console
        ]
    )
    train_df, test_df = load_df(TARGET_LABELS)

    train_dataset = EmbeddingDataset(train_df, TARGET_LABELS)
    test_dataset = EmbeddingDataset(test_df, TARGET_LABELS)
    # Shuffle training batches each epoch; a fixed file order gives the
    # optimizer the same correlated batches every time.
    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)
    test_loader = DataLoader(test_dataset, batch_size=32)
    logging.info(f"Initializing Dataset, train_loader: {len(train_loader)}, test_loader: {len(test_loader)}")

    # Pick the device at runtime instead of assuming Apple MPS is present.
    device = _select_device()
    logging.info(f"Using device: {device}")

    model = MultiLabelClassifier(embedding_dim=4096, hidden_dim=1024).to(device)
    optimizer = torch.optim.Adam(model.parameters(), lr=1e-3)
    # Focal loss is used here; nn.BCEWithLogitsLoss() is the plain alternative.
    criterion = FocalLoss(alpha=0.5, gamma=2.0)
    logging.info("Initializing model, optimizer and criterion")

    logging.info("Starting training")
    num_epochs = 50
    for epoch in range(num_epochs):
        model.train()
        running_loss = 0.0
        for inputs, targets in tqdm(train_loader, desc=f"Training Epoch {epoch}"):
            inputs, targets = inputs.to(device), targets.to(device)
            outputs = model(inputs)
            loss = criterion(outputs, targets.float())
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()
            running_loss += loss.item()
        # Log the epoch mean rather than whichever batch happened to be last.
        epoch_loss = running_loss / max(len(train_loader), 1)
        logging.info(f"Epoch {epoch}, Loss: {epoch_loss:.4f}")

        # Evaluate every fifth epoch, plus the last one so the saved weights
        # always have a matching test report.
        if epoch % 5 == 0 or epoch == num_epochs - 1:
            _evaluate(model, test_loader, criterion, device, epoch)

    # Save CPU tensors so the checkpoint loads on hosts without this device.
    cpu_state = {name: tensor.cpu() for name, tensor in model.state_dict().items()}
    torch.save(cpu_state, "data/classifier.pth")


if __name__ == "__main__":
    main()

requirements.txt CHANGED Viewed

@@ -3,4 +3,9 @@ numpy
 requests
 fastapi[standard]
 opencv-python
-tf-keras

 requests
 fastapi[standard]
 opencv-python
+tf-keras
+pandas
+torch
+scikit-learn
+gradio
+tqdm