Spaces: Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -10,7 +10,7 @@ from datasets import load_dataset
|
|
10 |
from tokenizers import ByteLevelBPETokenizer
|
11 |
import trl
|
12 |
|
13 |
- dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int( … [removed line truncated in extraction]
|
14 |
|
15 |
def get_training_corpus():
|
16 |
for i in range(0, len(dataset), 1000):
|
@@ -61,10 +61,10 @@ print(tokenizer.apply_chat_template([{"role": "user", "content": "Why is the sky
|
|
61 |
config = LlamaConfig(
|
62 |
vocab_size=tokenizer.vocab_size,
|
63 |
hidden_size=int(512 * 2),
|
64 |
- intermediate_size=int(1024 … [removed line truncated in extraction]
|
65 |
num_hidden_layers=int(8 * 2),
|
66 |
- num_attention_heads=int(8 … [removed line truncated in extraction]
|
67 |
- max_position_embeddings=int(512 … [removed line truncated in extraction]
|
68 |
rms_norm_eps=1e-6,
|
69 |
initializer_range=0.02,
|
70 |
use_cache=True,
|
|
|
10 |
from tokenizers import ByteLevelBPETokenizer
|
11 |
import trl
|
12 |
|
13 |
+ dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int(1e+4)))
|
14 |
|
15 |
def get_training_corpus():
|
16 |
for i in range(0, len(dataset), 1000):
|
|
|
61 |
config = LlamaConfig(
|
62 |
vocab_size=tokenizer.vocab_size,
|
63 |
hidden_size=int(512 * 2),
|
64 |
+ intermediate_size=int(1024 * 2),
|
65 |
num_hidden_layers=int(8 * 2),
|
66 |
+ num_attention_heads=int(8 * 2),
|
67 |
+ max_position_embeddings=int(512 * 2),
|
68 |
rms_norm_eps=1e-6,
|
69 |
initializer_range=0.02,
|
70 |
use_cache=True,
|