nroggendorff committed on
Commit
de2fc4e
·
verified ·
1 Parent(s): 7fe1c0a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -10,7 +10,7 @@ from datasets import load_dataset
10
  from tokenizers import ByteLevelBPETokenizer
11
  import trl
12
 
13
- dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int(2e+4)))
14
 
15
  def get_training_corpus():
16
  for i in range(0, len(dataset), 1000):
@@ -61,10 +61,10 @@ print(tokenizer.apply_chat_template([{"role": "user", "content": "Why is the sky
61
  config = LlamaConfig(
62
  vocab_size=tokenizer.vocab_size,
63
  hidden_size=int(512 * 2),
64
- intermediate_size=int(1024 / 1),
65
  num_hidden_layers=int(8 * 2),
66
- num_attention_heads=int(8 / 1),
67
- max_position_embeddings=int(512 / 1),
68
  rms_norm_eps=1e-6,
69
  initializer_range=0.02,
70
  use_cache=True,
 
10
  from tokenizers import ByteLevelBPETokenizer
11
  import trl
12
 
13
+ dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int(1e+4)))
14
 
15
  def get_training_corpus():
16
  for i in range(0, len(dataset), 1000):
 
61
  config = LlamaConfig(
62
  vocab_size=tokenizer.vocab_size,
63
  hidden_size=int(512 * 2),
64
+ intermediate_size=int(1024 * 2),
65
  num_hidden_layers=int(8 * 2),
66
+ num_attention_heads=int(8 * 2),
67
+ max_position_embeddings=int(512 * 2),
68
  rms_norm_eps=1e-6,
69
  initializer_range=0.02,
70
  use_cache=True,