Spaces:
Running
Running
Add hallucination tag to the "How to submit" page | Fix "show arena only" behaviour
Browse files
client/deps/_metadata.json
DELETED
@@ -1,8 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"hash": "dad2c8bd",
|
3 |
-
"configHash": "82e0a188",
|
4 |
-
"lockfileHash": "e3b0c442",
|
5 |
-
"browserHash": "9b3dc129",
|
6 |
-
"optimized": {},
|
7 |
-
"chunks": {}
|
8 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
client/deps/package.json
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"type": "module"
|
3 |
-
}
|
|
|
|
|
|
|
|
client/src/pages/HowToSubmitPage/HowToSubmitPage.jsx
CHANGED
@@ -223,6 +223,7 @@ const getTagEmoji = (tag) => {
|
|
223 |
reasoning: "🧠",
|
224 |
performance: "⚡",
|
225 |
safety: "🛡️",
|
|
|
226 |
},
|
227 |
task: {
|
228 |
rag: "🔍",
|
@@ -666,6 +667,7 @@ const HowToSubmitPage = () => {
|
|
666 |
"eval:reasoning",
|
667 |
"eval:performance",
|
668 |
"eval:safety",
|
|
|
669 |
"eval:rag",
|
670 |
]}
|
671 |
explanations={[
|
@@ -675,6 +677,7 @@ const HowToSubmitPage = () => {
|
|
675 |
"the evaluation tests <strong>reasoning abilities</strong>",
|
676 |
"model <strong>performance</strong> (speed, energy consumption, ...)",
|
677 |
"the evaluation considers <strong>safety</strong>, <strong>toxicity</strong>, <strong>bias</strong>",
|
|
|
678 |
"the evaluation tests <strong>RAG</strong> (Retrieval-Augmented Generation) capabilities",
|
679 |
]}
|
680 |
/>
|
|
|
223 |
reasoning: "🧠",
|
224 |
performance: "⚡",
|
225 |
safety: "🛡️",
|
226 |
+
hallucination: "🌫️",
|
227 |
},
|
228 |
task: {
|
229 |
rag: "🔍",
|
|
|
667 |
"eval:reasoning",
|
668 |
"eval:performance",
|
669 |
"eval:safety",
|
670 |
+
"eval:hallucination",
|
671 |
"eval:rag",
|
672 |
]}
|
673 |
explanations={[
|
|
|
677 |
"the evaluation tests <strong>reasoning abilities</strong>",
|
678 |
"model <strong>performance</strong> (speed, energy consumption, ...)",
|
679 |
"the evaluation considers <strong>safety</strong>, <strong>toxicity</strong>, <strong>bias</strong>",
|
680 |
+
"the evaluation measures the model's tendency to <strong>hallucinate</strong> or generate <strong>false information</strong>",
|
681 |
"the evaluation tests <strong>RAG</strong> (Retrieval-Augmented Generation) capabilities",
|
682 |
]}
|
683 |
/>
|
client/src/pages/LeaderboardPage/LeaderboardPage.jsx
CHANGED
@@ -34,9 +34,9 @@ const LeaderboardPageContent = () => {
|
|
34 |
leaderboards,
|
35 |
} = useLeaderboard();
|
36 |
|
37 |
-
// Check whether only a text search is active
|
38 |
const isOnlyTextSearch =
|
39 |
-
searchQuery
|
40 |
|
41 |
// Get all unique leaderboards across all sections
|
42 |
const allUniqueLeaderboards = useMemo(() => {
|
@@ -66,7 +66,7 @@ const LeaderboardPageContent = () => {
|
|
66 |
);
|
67 |
}, [leaderboards]);
|
68 |
|
69 |
-
// Filter all leaderboards for the text search
|
70 |
const searchResults = useMemo(() => {
|
71 |
if (!isOnlyTextSearch) return [];
|
72 |
return filterLeaderboards(allUniqueLeaderboards);
|
@@ -204,7 +204,13 @@ const LeaderboardPageContent = () => {
|
|
204 |
<Box key="search-results">
|
205 |
<LeaderboardSection
|
206 |
id="search-results"
|
207 |
-
title={
|
|
|
|
|
|
|
|
|
|
|
|
|
208 |
leaderboards={allUniqueLeaderboards}
|
209 |
filteredLeaderboards={searchResults}
|
210 |
/>
|
@@ -214,7 +220,13 @@ const LeaderboardPageContent = () => {
|
|
214 |
<Box key="search-results">
|
215 |
<LeaderboardSection
|
216 |
id="search-results"
|
217 |
-
title={
|
|
|
|
|
|
|
|
|
|
|
|
|
218 |
leaderboards={allUniqueLeaderboards}
|
219 |
filteredLeaderboards={[]}
|
220 |
showEmptyState={true}
|
|
|
34 |
leaderboards,
|
35 |
} = useLeaderboard();
|
36 |
|
37 |
+
// Check whether only a text search or the arena-only filter is active (no category selected)
|
38 |
const isOnlyTextSearch =
|
39 |
+
(searchQuery || arenaOnly) && selectedCategories.size === 0;
|
40 |
|
41 |
// Get all unique leaderboards across all sections
|
42 |
const allUniqueLeaderboards = useMemo(() => {
|
|
|
66 |
);
|
67 |
}, [leaderboards]);
|
68 |
|
69 |
+
// Filter all leaderboards for the text search or the arena-only filter
|
70 |
const searchResults = useMemo(() => {
|
71 |
if (!isOnlyTextSearch) return [];
|
72 |
return filterLeaderboards(allUniqueLeaderboards);
|
|
|
204 |
<Box key="search-results">
|
205 |
<LeaderboardSection
|
206 |
id="search-results"
|
207 |
+
title={
|
208 |
+
searchQuery
|
209 |
+
? `All leaderboards matching "${searchQuery}"${
|
210 |
+
arenaOnly ? " (Arena only)" : ""
|
211 |
+
}`
|
212 |
+
: "All Arena leaderboards"
|
213 |
+
}
|
214 |
leaderboards={allUniqueLeaderboards}
|
215 |
filteredLeaderboards={searchResults}
|
216 |
/>
|
|
|
220 |
<Box key="search-results">
|
221 |
<LeaderboardSection
|
222 |
id="search-results"
|
223 |
+
title={
|
224 |
+
searchQuery
|
225 |
+
? `All leaderboards matching "${searchQuery}"${
|
226 |
+
arenaOnly ? " (Arena only)" : ""
|
227 |
+
}`
|
228 |
+
: "All Arena leaderboards"
|
229 |
+
}
|
230 |
leaderboards={allUniqueLeaderboards}
|
231 |
filteredLeaderboards={[]}
|
232 |
showEmptyState={true}
|