|
name: "π€ Model Evaluation Request" |
|
description: Request EvalPlus maintainers to evaluate your model independently and update it on our leaderboard. |
|
title: "π€ [REQUEST] - <MODEL_NAME>" |
|
labels: ["model eval"] |
|
body: |
|
- type: textarea |
|
id: about |
|
attributes: |
|
label: "Model introduction" |
|
description: Provide a brief introduction to the model. |
|
placeholder: The models is created by ... and is used for ... |
|
validations: |
|
required: true |
|
- type: input |
|
id: url |
|
attributes: |
|
label: "Model URL" |
|
description: Indicate the URL (e.g., huggingface or other release pages) of the model |
|
placeholder: https://huggingface.co/[???]/[???] |
|
validations: |
|
required: true |
|
- type: dropdown |
|
id: dtype |
|
attributes: |
|
label: "Data type" |
|
description: What is the intended data type for running the model? |
|
multiple: false |
|
options: |
|
- "float16" |
|
- "bfloat16" |
|
- "float32" |
|
- "None of above: specify the details in the 'Other context' section" |
|
validations: |
|
required: true |
|
- type: textarea |
|
id: other |
|
attributes: |
|
label: "Additional instructions (Optional)" |
|
description: Special steps indicating how to run the model with preferably scripts/codes. |
|
placeholder: What data type precision should be used? What is the minimal hardware requirement? Can it be accelerated by tools such as vLLM? |
|
validations: |
|
required: false |
|
- type: dropdown |
|
id: author |
|
attributes: |
|
label: "Author" |
|
description: "Are you (one of) the author(s) of the model?" |
|
multiple: false |
|
options: |
|
- "Yes" |
|
- "No" |
|
validations: |
|
required: true |
|
- type: checkboxes |
|
id: security |
|
attributes: |
|
label: "Security" |
|
options: |
|
- label: "I confirm that the model is safe to run which does not contain any malicious code or content." |
|
required: true |
|
- type: checkboxes |
|
id: integrity |
|
attributes: |
|
label: "Integrity" |
|
options: |
|
- label: "I confirm that the model comes from unique and original work and does not contain any plagiarism." |
|
required: true |
|
|