nroggendorff committed on
Commit
d1a06b7
·
verified ·
1 Parent(s): d9dca90

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -7
app.py CHANGED
@@ -60,11 +60,11 @@ print(tokenizer.apply_chat_template([{"role": "user", "content": "Why is the sky
60
 
61
  config = LlamaConfig(
62
  vocab_size=tokenizer.vocab_size,
63
- hidden_size=512 * 2,
64
- intermediate_size=1024 * 2,
65
- num_hidden_layers=8 * 2,
66
- num_attention_heads=8 * 2,
67
- max_position_embeddings=512 * 2,
68
  rms_norm_eps=1e-6,
69
  initializer_range=0.02,
70
  use_cache=True,
@@ -98,8 +98,8 @@ print(dataset['text'][2])
98
 
99
  args = TrainingArguments(
100
  output_dir="mayo",
101
- num_train_epochs=2,
102
- per_device_train_batch_size=16,
103
  gradient_accumulation_steps=4,
104
  learning_rate=1e-5,
105
  save_steps=100000,
 
60
 
61
  config = LlamaConfig(
62
  vocab_size=tokenizer.vocab_size,
63
+ hidden_size=512,
64
+ intermediate_size=1024,
65
+ num_hidden_layers=8,
66
+ num_attention_heads=8,
67
+ max_position_embeddings=512,
68
  rms_norm_eps=1e-6,
69
  initializer_range=0.02,
70
  use_cache=True,
 
98
 
99
  args = TrainingArguments(
100
  output_dir="mayo",
101
+ num_train_epochs=4,
102
+ per_device_train_batch_size=64,
103
  gradient_accumulation_steps=4,
104
  learning_rate=1e-5,
105
  save_steps=100000,