nroggendorff committed on
Commit
c987618
·
verified ·
1 Parent(s): aa4a704

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -59,10 +59,10 @@ print(tokenizer.apply_chat_template([{"role": "user", "content": "Why is the sky
59
 
60
  config = LlamaConfig(
61
  vocab_size=tokenizer.vocab_size,
62
- hidden_size=int(512 / 1),
63
- intermediate_size=int(1024 / 1),
64
- num_hidden_layers=int(8 / 1),
65
- num_attention_heads=int(8 / 1),
66
  max_position_embeddings=int(512 / 1),
67
  rms_norm_eps=1e-6,
68
  initializer_range=0.02,
@@ -97,7 +97,7 @@ print(dataset['text'][2])
97
 
98
  args = TrainingArguments(
99
  output_dir="mayo",
100
- num_train_epochs=4,
101
  gradient_accumulation_steps=4,
102
  per_device_train_batch_size=1,
103
  learning_rate=1e-5,
 
59
 
60
  config = LlamaConfig(
61
  vocab_size=tokenizer.vocab_size,
62
+ hidden_size=int(512 / 4),
63
+ intermediate_size=int(1024 / 4),
64
+ num_hidden_layers=int(8 / 4),
65
+ num_attention_heads=int(8 / 4),
66
  max_position_embeddings=int(512 / 1),
67
  rms_norm_eps=1e-6,
68
  initializer_range=0.02,
 
97
 
98
  args = TrainingArguments(
99
  output_dir="mayo",
100
+ num_train_epochs=1,
101
  gradient_accumulation_steps=4,
102
  per_device_train_batch_size=1,
103
  learning_rate=1e-5,