Spaces:
Running
Running
/** | |
* | |
* Copyright 2023-2025 InspectorRAGet Team | |
* | |
* Licensed under the Apache License, Version 2.0 (the "License"); | |
* you may not use this file except in compliance with the License. | |
* You may obtain a copy of the License at | |
* | |
* http://www.apache.org/licenses/LICENSE-2.0 | |
* | |
* Unless required by applicable law or agreed to in writing, software | |
* distributed under the License is distributed on an "AS IS" BASIS, | |
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
* See the License for the specific language governing permissions and | |
* limitations under the License. | |
* | |
**/ | |
import { memo } from 'react'; | |
import { Button, ButtonSkeleton, UnorderedList, ListItem } from '@carbon/react'; | |
import { ArrowRight } from '@carbon/icons-react'; | |
import classes from './Instructions.module.scss'; | |
interface Props { | |
loading?: boolean; | |
onClick: Function; | |
} | |
export default memo(function InstructionsView({ | |
loading = false, | |
onClick, | |
}: Props) { | |
return ( | |
<div className={classes.root}> | |
<div className={classes.instructionsContainer}> | |
<h4>Instructions</h4> | |
<p> | |
Use the Analytics platform to examine and analyze LLM evaluation | |
experiments. The experiments are assumed to comprise: | |
</p> | |
<UnorderedList> | |
<ListItem> | |
A dataset of tasks, where each task has at least one triplet of | |
context, grounding document and response. There may be multiple | |
responses, if multiple models are being evaluated simultaneously (at | |
most 5 models are allowed). | |
</ListItem> | |
<ListItem> | |
Each response is evaluated on at least one metric. A metric may be | |
categorical (yes/no, Likert scale) or numeric. One experiment may | |
include any number of categorical or numeric metrics, though we | |
strongly caution against including too many as this makes the | |
instance-level analysis challenging. | |
</ListItem> | |
<ListItem> | |
There is at least one annotator / evaluator. The annotator may be | |
human or algorithm (whether a defined quanititative metric, or an | |
LLM). One experiment may include any number of human or algorithmic | |
annotators. | |
</ListItem> | |
</UnorderedList> | |
<p> | |
Upload your experiment data on the following page, which contains a | |
detailed example of the expected schema. You will need to provide | |
sufficient metadata about the tasks, metrics, and annotators. If the | |
uploaded document is not well-formed, you will see a verification | |
error. | |
</p> | |
</div> | |
<div className={classes.proceedButton}> | |
{loading ? ( | |
<ButtonSkeleton /> | |
) : ( | |
<Button className={classes.proceedButtonContent} onClick={onClick}> | |
<span>Get started</span> | |
<ArrowRight /> | |
</Button> | |
)} | |
</div> | |
</div> | |
); | |
}); | |