File size: 3,858 Bytes
b2ecf7d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
import type { TaskDataCustom } from "../Types";

/**
 * Static metadata for the text-generation task.
 *
 * The object groups hand-curated examples under the following keys:
 * - `datasets`: dataset ids with a one-line description each.
 * - `demo`: one sample text input and the matching sample text output.
 * - `metrics`: evaluation metrics with a short explanation each.
 * - `models`: model ids with a one-line description each.
 * - `spaces`: demo application ids with a one-line description each.
 * - `summary`: a short description of the task itself.
 * - `widgetModels`: model ids listed for the widget.
 * - `youtubeId`: id of a related video.
 *
 * All descriptions are user-facing prose, so they are kept as complete,
 * grammatical sentences ending with a period.
 */
const taskData: TaskDataCustom = {
	datasets: [
		{
			description: "A large multilingual dataset of text crawled from the web.",
			id: "mc4",
		},
		{
			description:
				"Diverse open-source data consisting of 22 smaller high-quality datasets. It was used to train GPT-Neo.",
			id: "the_pile",
		},
		{
			description: "A crowd-sourced instruction dataset to develop an AI assistant.",
			id: "OpenAssistant/oasst1",
		},
		{
			description: "A crowd-sourced instruction dataset created by Databricks employees.",
			id: "databricks/databricks-dolly-15k",
		},
	],
	demo: {
		inputs: [
			{
				label: "Input",
				content: "Once upon a time,",
				type: "text",
			},
		],
		outputs: [
			{
				label: "Output",
				content:
					"Once upon a time, we knew that our ancestors were on the verge of extinction. The great explorers and poets of the Old World, from Alexander the Great to Chaucer, are dead and gone. A good many of our ancient explorers and poets have",
				type: "text",
			},
		],
	},
	metrics: [
		{
			description:
				"Cross Entropy is a metric that calculates the difference between two probability distributions. Each probability distribution is the distribution of predicted words.",
			id: "Cross Entropy",
		},
		{
			description:
				"The Perplexity metric is the exponential of the cross-entropy loss. It evaluates the probabilities assigned to the next word by the model. Lower perplexity indicates better performance.",
			id: "Perplexity",
		},
	],
	models: [
		{
			description: "A large language model trained for text generation.",
			id: "bigscience/bloom-560m",
		},
		{
			description: "A large code generation model that can generate code in 80+ languages.",
			id: "bigcode/starcoder",
		},
		{
			description: "A model trained to follow instructions, uses Pythia-12b as base model.",
			id: "databricks/dolly-v2-12b",
		},
		{
			description: "A model trained to follow instructions curated by community, uses Pythia-12b as base model.",
			id: "OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5",
		},
		{
			description: "A large language model trained to generate text in English.",
			id: "stabilityai/stablelm-tuned-alpha-7b",
		},
		{
			description: "A model trained to follow instructions, based on mosaicml/mpt-7b.",
			id: "mosaicml/mpt-7b-instruct",
		},
		{
			description: "A large language model trained to generate text in English.",
			id: "EleutherAI/pythia-12b",
		},
		{
			description: "A large text-to-text model trained to follow instructions.",
			id: "google/flan-ul2",
		},
		{
			description: "A large and powerful text generation model.",
			id: "tiiuae/falcon-40b",
		},
		{
			description: "State-of-the-art open-source large language model.",
			id: "meta-llama/Llama-2-70b-hf",
		},
	],
	spaces: [
		{
			description: "A robust text generation model that can perform various tasks through natural language prompting.",
			id: "huggingface/bloom_demo",
		},
		{
			description: "A text generation based application that can write code for 80+ languages.",
			id: "bigcode/bigcode-playground",
		},
		{
			description: "A text generation based application for conversations.",
			id: "h2oai/h2ogpt-chatbot",
		},
		{
			description: "A text generation application that combines OpenAI and Hugging Face models.",
			id: "microsoft/HuggingGPT",
		},
		{
			description: "A text generation application that uses StableLM-tuned-alpha-7b.",
			id: "stabilityai/stablelm-tuned-alpha-chat",
		},
		{
			// NOTE(review): this description names the same model as the entry above;
			// it may be a copy-paste — confirm which model this space actually uses.
			description: "A UI that uses StableLM-tuned-alpha-7b.",
			id: "togethercomputer/OpenChatKit",
		},
	],
	summary:
		"Generating text is the task of producing new text. These models can, for example, fill in incomplete text or paraphrase.",
	widgetModels: ["tiiuae/falcon-7b-instruct"],
	youtubeId: "Vpjb1lu0MDk",
};

export default taskData;