Spaces:

yourbench
/

demo

Running on CPU Upgrade

App Files Files Community

tfrere committed on Apr 1

Commit

d6f0b38

1 Parent(s): 2d879b7

block >1MB files | translate comments into English

Browse files

Files changed (10) hide show

backend/routes/benchmark.py +16 -16
backend/tasks/evaluation_task.py +12 -12
backend/tests/run_bench.py +1 -1
backend/tests/run_lighteval.py +3 -3
frontend/src/App.js +14 -14
frontend/src/components/BenchmarkCreateForm.jsx +23 -0
frontend/src/components/BenchmarkDisplay.jsx +5 -20
frontend/src/pages/BenchmarkDisplayPage.jsx +11 -16
frontend/src/pages/BenchmarkEvaluationPage.jsx +6 -10
test_import.py +2 -2

backend/routes/benchmark.py CHANGED Viewed

@@ -27,9 +27,9 @@ async def generate_benchmark(data: Dict[str, Any]):
     """
     session_id = data.get("session_id")
-    # Débogage pour vérifier les session_files et le session_id reçu
-    print(f"DEBUG: Session ID reçu: {session_id}")
-    print(f"DEBUG: Session files disponibles: {list(router.session_files.keys())}")
     if not session_id or session_id not in router.session_files:
         return {"error": "Invalid or missing session ID"}
@@ -112,9 +112,9 @@ class UnifiedBenchmarkTask:
         Args:
             message: Log message to add
         """
-        if message not in self.logs:  # Éviter les doublons
             self.logs.append(message)
-            # Forcer une copie pour éviter les problèmes de référence
             self.logs = self.logs.copy()
             print(f"[{self.session_uid}] {message}")
@@ -143,7 +143,7 @@ class UnifiedBenchmarkTask:
         Args:
             file_path: Path to the uploaded file
         """
-        # Démarrer dans un thread séparé pour ne pas bloquer
         import threading
         thread = threading.Thread(target=self._run_process, args=(file_path,))
         thread.daemon = True
@@ -157,43 +157,43 @@ class UnifiedBenchmarkTask:
             file_path: Path to the uploaded file
         """
         try:
-            # Étape 1: Configuration
             self._add_log("[INFO] Starting configuration process")
             self.config_task = CreateBenchConfigTask(session_uid=self.session_uid)
-            # Exécuter la tâche de configuration
             config_path = self.config_task.run(file_path=file_path)
-            # Récupérer les logs de configuration
             config_logs = self.config_task.get_logs()
             for log in config_logs:
                 self._add_log(log)
-            # Marquer l'étape de configuration comme terminée
             if "[SUCCESS] Stage completed: config_generation" not in self.logs:
                 self._add_log("[SUCCESS] Stage completed: configuration")
-            # Étape 2: Benchmark
             self._add_log("[INFO] Starting benchmark process")
             self.bench_task = CreateBenchTask(session_uid=self.session_uid, config_path=config_path)
-            # Exécuter la tâche de benchmark
             self.bench_task.run()
-            # Attendre que la tâche de benchmark soit terminée
             while not self.bench_task.is_task_completed():
-                # Récupérer les nouveaux logs et les ajouter
                 bench_logs = self.bench_task.get_logs()
                 for log in bench_logs:
                     self._add_log(log)
                 time.sleep(1)
-            # Récupérer les logs finaux
             final_logs = self.bench_task.get_logs()
             for log in final_logs:
                 self._add_log(log)
-            # Marquer comme terminé
             self.is_completed = True
             self._add_log("[SUCCESS] Benchmark process completed successfully")

     """
     session_id = data.get("session_id")
+    # Debug to check session_files and received session_id
+    print(f"DEBUG: Session ID received: {session_id}")
+    print(f"DEBUG: Available session files: {list(router.session_files.keys())}")
     if not session_id or session_id not in router.session_files:
         return {"error": "Invalid or missing session ID"}
         Args:
             message: Log message to add
         """
+        if message not in self.logs:  # Avoid duplicates
             self.logs.append(message)
+            # Force a copy to avoid reference problems
             self.logs = self.logs.copy()
             print(f"[{self.session_uid}] {message}")
         Args:
             file_path: Path to the uploaded file
         """
+        # Start in a separate thread to avoid blocking
         import threading
         thread = threading.Thread(target=self._run_process, args=(file_path,))
         thread.daemon = True
             file_path: Path to the uploaded file
         """
         try:
+            # Step 1: Configuration
             self._add_log("[INFO] Starting configuration process")
             self.config_task = CreateBenchConfigTask(session_uid=self.session_uid)
+            # Execute the configuration task
             config_path = self.config_task.run(file_path=file_path)
+            # Get configuration logs
             config_logs = self.config_task.get_logs()
             for log in config_logs:
                 self._add_log(log)
+            # Mark configuration step as completed
             if "[SUCCESS] Stage completed: config_generation" not in self.logs:
                 self._add_log("[SUCCESS] Stage completed: configuration")
+            # Step 2: Benchmark
             self._add_log("[INFO] Starting benchmark process")
             self.bench_task = CreateBenchTask(session_uid=self.session_uid, config_path=config_path)
+            # Run the benchmark task
             self.bench_task.run()
+            # Wait for the benchmark task to complete
             while not self.bench_task.is_task_completed():
+                # Get new logs and add them
                 bench_logs = self.bench_task.get_logs()
                 for log in bench_logs:
                     self._add_log(log)
                 time.sleep(1)
+            # Get final logs
             final_logs = self.bench_task.get_logs()
             for log in final_logs:
                 self._add_log(log)
+            # Mark as completed
             self.is_completed = True
             self._add_log("[SUCCESS] Benchmark process completed successfully")

backend/tasks/evaluation_task.py CHANGED Viewed

@@ -47,28 +47,28 @@ class EvaluationTask:
     def clean_old_results(self) -> None:
         """
-        Nettoie les anciens résultats d'évaluation pour éviter toute confusion
         """
-        print(f"[{datetime.now().strftime('%H:%M:%S')}] Vérification et nettoyage des anciens résultats...")
-        # Chemin vers les résultats LightEval
         results_dir = Path(f"uploaded_files/{self.session_uid}/lighteval_results")
-        # Supprimer si existant
         if results_dir.exists():
-            print(f"[{datetime.now().strftime('%H:%M:%S')}] Suppression des anciens résultats LightEval")
             shutil.rmtree(results_dir)
-            print(f"[{datetime.now().strftime('%H:%M:%S')}] Nettoyage terminé")
         else:
-            print(f"[{datetime.now().strftime('%H:%M:%S')}] Aucun ancien résultat trouvé")
-        # Vérifier aussi les résultats intermédiaires de lighteval
         if os.path.exists("data/lighteval_results"):
-            print(f"[{datetime.now().strftime('%H:%M:%S')}] Nettoyage des résultats intermédiaires")
             try:
                 shutil.rmtree("data/lighteval_results", ignore_errors=True)
             except Exception as e:
-                print(f"[{datetime.now().strftime('%H:%M:%S')}] Erreur lors du nettoyage des résultats intermédiaires: {str(e)}")
     def _save_results_to_hub(self) -> None:
         """
@@ -224,9 +224,9 @@ TASKS_TABLE = [yourbench]
         Run the evaluation task asynchronously
         Args:
-            clean_first: If True, clean old results before starting (par défaut: True)
         """
-        # Nettoyer systématiquement les anciens résultats avant de commencer
         self.clean_old_results()
         # Start global timer

     def clean_old_results(self) -> None:
         """
+        Clean old evaluation results to avoid confusion
         """
+        print(f"[{datetime.now().strftime('%H:%M:%S')}] Checking and cleaning old results...")
+        # Path to LightEval results
         results_dir = Path(f"uploaded_files/{self.session_uid}/lighteval_results")
+        # Delete if exists
         if results_dir.exists():
+            print(f"[{datetime.now().strftime('%H:%M:%S')}] Deleting old LightEval results")
             shutil.rmtree(results_dir)
+            print(f"[{datetime.now().strftime('%H:%M:%S')}] Cleaning complete")
         else:
+            print(f"[{datetime.now().strftime('%H:%M:%S')}] No old results found")
+        # Also check for intermediate lighteval results
         if os.path.exists("data/lighteval_results"):
+            print(f"[{datetime.now().strftime('%H:%M:%S')}] Cleaning intermediate results")
             try:
                 shutil.rmtree("data/lighteval_results", ignore_errors=True)
             except Exception as e:
+                print(f"[{datetime.now().strftime('%H:%M:%S')}] Error cleaning intermediate results: {str(e)}")
     def _save_results_to_hub(self) -> None:
         """
         Run the evaluation task asynchronously
         Args:
+            clean_first: If True, clean old results before starting (default: True)
         """
+        # Systematically clean old results before starting
         self.clean_old_results()
         # Start global timer

backend/tests/run_bench.py CHANGED Viewed

@@ -20,4 +20,4 @@ subprocess.run(command, env=os.environ)
 # Calculate and print execution time
 execution_time = time.time() - start_time
-print(f"\nTemps d'exécution : {execution_time:.2f} secondes")

 # Calculate and print execution time
 execution_time = time.time() - start_time
+print(f"\nExecution time: {execution_time:.2f} seconds")

backend/tests/run_lighteval.py CHANGED Viewed

@@ -22,7 +22,7 @@ yourbench = create_yourbench_task("yourbench/yourbench_fbfe278f-70c8-4579-9447-8
 TASKS_TABLE = [yourbench]
 """)
-# Créer un dossier de sortie avec timestamp pour éviter d'écraser les anciens résultats
 output_dir = f"data/lighteval_results_strict_{datetime.datetime.now().strftime('%Y%m%d_%H%M%S')}"
 # LightEval command
@@ -48,8 +48,8 @@ subprocess.run(cmd_args, env=os.environ)
 # Calculate and print execution time
 execution_time = time.time() - start_time
-print(f"\nTemps d'exécution : {execution_time:.2f} secondes")
-print(f"Résultats sauvegardés dans : {output_dir}")
 # Clean up
 os.unlink(temp_file_path)

 TASKS_TABLE = [yourbench]
 """)
+# Create an output folder with timestamp to avoid overwriting previous results
 output_dir = f"data/lighteval_results_strict_{datetime.datetime.now().strftime('%Y%m%d_%H%M%S')}"
 # LightEval command
 # Calculate and print execution time
 execution_time = time.time() - start_time
+print(f"\nExecution time: {execution_time:.2f} seconds")
+print(f"Results saved in: {output_dir}")
 # Clean up
 os.unlink(temp_file_path)

frontend/src/App.js CHANGED Viewed

@@ -17,12 +17,12 @@ import BenchmarkDisplayPage from "./pages/BenchmarkDisplayPage";
 import BenchmarkEvaluationPage from "./pages/BenchmarkEvaluationPage";
 import EvaluationDisplayPage from "./pages/EvaluationDisplayPage";
-// Fonction pour synchroniser les hash URL avec la page parente Hugging Face
 const syncURLWithParent = () => {
-  // Cette fonction est nécessaire uniquement dans un environnement Hugging Face Spaces
   if (window.parent !== window) {
     try {
-      // On envoie le hash actuel à la page parente (Hugging Face)
       window.parent.postMessage(
         {
           hash: window.location.hash,
@@ -30,7 +30,7 @@ const syncURLWithParent = () => {
         "https://huggingface.co"
       );
-      // On log pour débogage
       console.log("Synced hash with parent:", window.location.hash);
     } catch (error) {
       console.error("Error syncing URL with parent:", error);
@@ -42,36 +42,36 @@ function App() {
   const { mode } = useThemeMode();
   const theme = getTheme(mode);
-  // Effet pour surveiller les changements de hash et les synchroniser
   useEffect(() => {
-    // Fonction de gestionnaire d'événements pour les changements de hash
     const handleHashChange = () => {
       syncURLWithParent();
     };
-    // Fonction pour gérer les messages reçus de la page parente
     const handleParentMessage = (event) => {
-      // Vérifier que le message vient bien de Hugging Face
       if (event.origin === "https://huggingface.co") {
-        // Si le message contient un hash et qu'il est différent du hash actuel
         if (event.data.hash && event.data.hash !== window.location.hash) {
           console.log("Received hash from parent:", event.data.hash);
-          // Mettre à jour le hash de l'URL sans recharger la page
           window.location.hash = event.data.hash;
         }
       }
     };
-    // On synchronise au chargement initial
     syncURLWithParent();
-    // On écoute les changements de hash
     window.addEventListener("hashchange", handleHashChange);
-    // On écoute les messages de la page parente
     window.addEventListener("message", handleParentMessage);
-    // Nettoyage
     return () => {
       window.removeEventListener("hashchange", handleHashChange);
       window.removeEventListener("message", handleParentMessage);

 import BenchmarkEvaluationPage from "./pages/BenchmarkEvaluationPage";
 import EvaluationDisplayPage from "./pages/EvaluationDisplayPage";
+// Function to synchronize URL hash with parent Hugging Face page
 const syncURLWithParent = () => {
+  // This function is only necessary in a Hugging Face Spaces environment
   if (window.parent !== window) {
     try {
+      // Send the current hash to the parent page (Hugging Face)
       window.parent.postMessage(
         {
           hash: window.location.hash,
         "https://huggingface.co"
       );
+      // Log for debugging
       console.log("Synced hash with parent:", window.location.hash);
     } catch (error) {
       console.error("Error syncing URL with parent:", error);
   const { mode } = useThemeMode();
   const theme = getTheme(mode);
+  // Effect to monitor hash changes and synchronize them
   useEffect(() => {
+    // Event handler function for hash changes
     const handleHashChange = () => {
       syncURLWithParent();
     };
+    // Function to handle messages received from the parent page
     const handleParentMessage = (event) => {
+      // Verify that the message comes from Hugging Face
       if (event.origin === "https://huggingface.co") {
+        // If the message contains a hash and it's different from the current hash
         if (event.data.hash && event.data.hash !== window.location.hash) {
           console.log("Received hash from parent:", event.data.hash);
+          // Update the URL hash without reloading the page
           window.location.hash = event.data.hash;
         }
       }
     };
+    // Synchronize on initial load
     syncURLWithParent();
+    // Listen for hash changes
     window.addEventListener("hashchange", handleHashChange);
+    // Listen for messages from the parent page
     window.addEventListener("message", handleParentMessage);
+    // Cleanup
     return () => {
       window.removeEventListener("hashchange", handleHashChange);
       window.removeEventListener("message", handleParentMessage);

frontend/src/components/BenchmarkCreateForm.jsx CHANGED Viewed

@@ -96,6 +96,17 @@ function BenchmarkCreateForm({ onStartGeneration }) {
         success: false,
         message: "Only PDF, TXT, HTML and MD files are accepted",
       });
       return;
     }
@@ -152,6 +163,7 @@ function BenchmarkCreateForm({ onStartGeneration }) {
     const file = e.dataTransfer.files[0];
     if (!file) {
       setUploadStatus({ success: false, message: "No file detected" });
       return;
     }
@@ -166,6 +178,17 @@ function BenchmarkCreateForm({ onStartGeneration }) {
         success: false,
         message: "Only PDF, TXT, HTML and MD files are accepted",
       });
       return;
     }

         success: false,
         message: "Only PDF, TXT, HTML and MD files are accepted",
       });
+      setOpenSnackbar(true);
+      return;
+    }
+    // Check file size limit (1MB = 1048576 bytes)
+    if (file.size > 1048576) {
+      setUploadStatus({
+        success: false,
+        message: "File size exceeds the 1MB limit",
+      });
+      setOpenSnackbar(true);
       return;
     }
     const file = e.dataTransfer.files[0];
     if (!file) {
       setUploadStatus({ success: false, message: "No file detected" });
+      setOpenSnackbar(true);
       return;
     }
         success: false,
         message: "Only PDF, TXT, HTML and MD files are accepted",
       });
+      setOpenSnackbar(true);
+      return;
+    }
+    // Check file size limit (1MB = 1048576 bytes)
+    if (file.size > 1048576) {
+      setUploadStatus({
+        success: false,
+        message: "File size exceeds the 1MB limit",
+      });
+      setOpenSnackbar(true);
       return;
     }

frontend/src/components/BenchmarkDisplay.jsx CHANGED Viewed

@@ -10,8 +10,6 @@ import {
   Link,
   CircularProgress,
   Tooltip,
-  useTheme,
-  useMediaQuery,
 } from "@mui/material";
 import PlayArrowIcon from "@mui/icons-material/PlayArrow";
 import AssessmentIcon from "@mui/icons-material/Assessment";
@@ -40,9 +38,7 @@ const BenchmarkDisplay = ({
 }) => {
   const [isDownloading, setIsDownloading] = useState(false);
   const { mode } = useThemeMode();
-  const theme = useTheme();
-  const isMobile = useMediaQuery(theme.breakpoints.down("sm"));
-  const themeColors = getTheme(mode);
   // Default questions if none provided
   const questions =
@@ -99,10 +95,8 @@ const BenchmarkDisplay = ({
         sx={{
           mb: 4,
           display: "flex",
-          flexDirection: isMobile ? "column" : "row",
           justifyContent: "space-between",
-          alignItems: isMobile ? "flex-start" : "center",
-          gap: isMobile ? 2 : 0,
         }}
       >
         <Box sx={{ display: "flex", alignItems: "center" }}>
@@ -110,14 +104,7 @@ const BenchmarkDisplay = ({
           <Typography variant="h6">Benchmark Created Successfully</Typography>
         </Box>
-        <Box
-          sx={{
-            display: "flex",
-            gap: 2,
-            width: isMobile ? "100%" : "auto",
-            flexDirection: isMobile ? "column" : "row",
-          }}
-        >
           <Tooltip title="Download the complete benchmark">
             <Button
               variant="outlined"
@@ -131,7 +118,6 @@ const BenchmarkDisplay = ({
               }
               onClick={handleDownloadClick}
               disabled={isDownloading || !sessionId}
-              fullWidth={isMobile}
             >
               {isDownloading ? "Downloading..." : "Download Benchmark"}
             </Button>
@@ -142,7 +128,6 @@ const BenchmarkDisplay = ({
             color="primary"
             startIcon={<AssessmentIcon />}
             onClick={handleEvaluationClick}
-            fullWidth={isMobile}
           >
             Start Evaluation
           </Button>
@@ -160,8 +145,8 @@ const BenchmarkDisplay = ({
             variant="outlined"
             sx={{
               mb: 2,
-              backgroundColor: themeColors.palette.background.subtle,
-              border: `1px solid ${themeColors.palette.divider}`,
             }}
           >
             <CardContent>

   Link,
   CircularProgress,
   Tooltip,
 } from "@mui/material";
 import PlayArrowIcon from "@mui/icons-material/PlayArrow";
 import AssessmentIcon from "@mui/icons-material/Assessment";
 }) => {
   const [isDownloading, setIsDownloading] = useState(false);
   const { mode } = useThemeMode();
+  const theme = getTheme(mode);
   // Default questions if none provided
   const questions =
         sx={{
           mb: 4,
           display: "flex",
           justifyContent: "space-between",
+          alignItems: "center",
         }}
       >
         <Box sx={{ display: "flex", alignItems: "center" }}>
           <Typography variant="h6">Benchmark Created Successfully</Typography>
         </Box>
+        <Box sx={{ display: "flex", gap: 2 }}>
           <Tooltip title="Download the complete benchmark">
             <Button
               variant="outlined"
               }
               onClick={handleDownloadClick}
               disabled={isDownloading || !sessionId}
             >
               {isDownloading ? "Downloading..." : "Download Benchmark"}
             </Button>
             color="primary"
             startIcon={<AssessmentIcon />}
             onClick={handleEvaluationClick}
           >
             Start Evaluation
           </Button>
             variant="outlined"
             sx={{
               mb: 2,
+              backgroundColor: theme.palette.background.subtle,
+              border: `1px solid ${theme.palette.divider}`,
             }}
           >
             <CardContent>

frontend/src/pages/BenchmarkDisplayPage.jsx CHANGED Viewed

@@ -22,7 +22,7 @@ function BenchmarkDisplayPage() {
     console.log("BenchmarkDisplayPage useEffect - sessionId:", sessionId);
     if (!sessionId) {
-      console.log("Session ID manquante, redirection vers l'accueil");
       setIsValidSession(false);
       return;
     }
@@ -30,39 +30,34 @@ function BenchmarkDisplayPage() {
     setIsLoading(true);
     const fetchBenchmarkQuestions = async () => {
-      console.log(
-        "Tentative de récupération des questions pour la session:",
-        sessionId
-      );
       try {
         const apiUrl = `${API_CONFIG.BASE_URL}/benchmark-questions/${sessionId}`;
-        console.log("Appel API:", apiUrl);
         const response = await fetch(apiUrl);
-        console.log("Réponse API reçue:", response.status);
         if (!response.ok) {
           if (response.status === 404) {
-            console.error("Session non trouvée");
             setIsValidSession(false);
             return;
           } else {
-            console.error(`Erreur serveur: ${response.status}`);
             setIsLoading(false);
             return;
           }
         }
         const data = await response.json();
-        console.log("Données API:", data);
         if (data.success && data.questions && data.questions.length > 0) {
-          console.log("Questions chargées avec succès:", data.questions);
           setBenchmarkQuestions(data.questions);
         } else {
-          console.warn(
-            "Échec du chargement des questions, utilisation des valeurs par défaut"
-          );
         }
         if (data.dataset_url) {
@@ -70,10 +65,10 @@ function BenchmarkDisplayPage() {
         } else {
           const url = `https://huggingface.co/datasets/yourbench/yourbench_${sessionId}`;
           setDatasetUrl(url);
-          console.log("URL du dataset générée:", url);
         }
       } catch (error) {
-        console.error("Erreur lors de la récupération des questions:", error);
         setIsValidSession(false);
       } finally {
         setIsLoading(false);

     console.log("BenchmarkDisplayPage useEffect - sessionId:", sessionId);
     if (!sessionId) {
+      console.log("Missing session ID, redirecting to home");
       setIsValidSession(false);
       return;
     }
     setIsLoading(true);
     const fetchBenchmarkQuestions = async () => {
+      console.log("Attempting to fetch questions for session:", sessionId);
       try {
         const apiUrl = `${API_CONFIG.BASE_URL}/benchmark-questions/${sessionId}`;
+        console.log("API call:", apiUrl);
         const response = await fetch(apiUrl);
+        console.log("API response received:", response.status);
         if (!response.ok) {
           if (response.status === 404) {
+            console.error("Session not found");
             setIsValidSession(false);
             return;
           } else {
+            console.error(`Server error: ${response.status}`);
             setIsLoading(false);
             return;
           }
         }
         const data = await response.json();
+        console.log("API data:", data);
         if (data.success && data.questions && data.questions.length > 0) {
+          console.log("Questions loaded successfully:", data.questions);
           setBenchmarkQuestions(data.questions);
         } else {
+          console.warn("Failed to load questions, using default values");
         }
         if (data.dataset_url) {
         } else {
           const url = `https://huggingface.co/datasets/yourbench/yourbench_${sessionId}`;
           setDatasetUrl(url);
+          console.log("Dataset URL generated:", url);
         }
       } catch (error) {
+        console.error("Error retrieving questions:", error);
         setIsValidSession(false);
       } finally {
         setIsLoading(false);

frontend/src/pages/BenchmarkEvaluationPage.jsx CHANGED Viewed

@@ -17,14 +17,12 @@ function BenchmarkEvaluationPage() {
   useEffect(() => {
     if (!sessionId) {
-      console.log(
-        "Session ID manquante pour l'évaluation, redirection vers l'accueil"
-      );
       setIsValidSession(false);
       return;
     }
-    // Si c'est un document précalculé, on le considère comme valide directement
     if (isDefault) {
       setIsLoading(false);
       return;
@@ -37,13 +35,11 @@ function BenchmarkEvaluationPage() {
         );
         if (!response.ok) {
-          console.error(
-            `Session invalide ou erreur serveur: ${response.status}`
-          );
           setIsValidSession(false);
         }
       } catch (error) {
-        console.error("Erreur lors de la vérification de la session:", error);
         setIsValidSession(false);
       } finally {
         setIsLoading(false);
@@ -54,8 +50,8 @@ function BenchmarkEvaluationPage() {
   }, [sessionId, isDefault]);
   const handleEvaluationComplete = (result) => {
-    console.log("Évaluation terminée:", result);
-    // La redirection est gérée par le composant BenchmarkEvaluation
   };
   if (!isValidSession) {

   useEffect(() => {
     if (!sessionId) {
+      console.log("Missing session ID for evaluation, redirecting to home");
       setIsValidSession(false);
       return;
     }
+    // If it's a precalculated document, consider it valid directly
     if (isDefault) {
       setIsLoading(false);
       return;
         );
         if (!response.ok) {
+          console.error(`Invalid session or server error: ${response.status}`);
           setIsValidSession(false);
         }
       } catch (error) {
+        console.error("Error checking session:", error);
         setIsValidSession(false);
       } finally {
         setIsLoading(false);
   }, [sessionId, isDefault]);
   const handleEvaluationComplete = (result) => {
+    console.log("Evaluation completed:", result);
+    // Redirection is handled by the BenchmarkEvaluation component
   };
   if (!isValidSession) {

test_import.py CHANGED Viewed

@@ -1,5 +1,5 @@
 try:
     import lighteval_task
-    print("lighteval_task importé avec succès!")
 except ImportError as e:
-    print(f"Erreur: {e}")

 try:
     import lighteval_task
+    print("lighteval_task imported successfully!")
 except ImportError as e:
+    print(f"Error: {e}")