flamiry committed on
Commit
27866c0
·
verified ·
1 Parent(s): 3dbf125

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -5
app.py CHANGED
@@ -3,8 +3,10 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
3
  import torch
4
  from datasets import load_dataset
5
  import spaces
 
 
 
6
 
7
- # Load model once at startup
8
  try:
9
  model = AutoModelForCausalLM.from_pretrained("flamiry/first")
10
  tokenizer = AutoTokenizer.from_pretrained("flamiry/first")
@@ -16,11 +18,9 @@ tokenizer.pad_token = tokenizer.eos_token
16
  @spaces.GPU
17
  def train_model():
18
  try:
19
- # Load Slovak data
20
  dataset = load_dataset("DGurgurov/slovak_sa", split="train")
21
  slovak_texts = list(dataset['text'])[:50]
22
 
23
- # Tokenize
24
  inputs = tokenizer(
25
  slovak_texts,
26
  return_tensors="pt",
@@ -29,7 +29,6 @@ def train_model():
29
  max_length=64
30
  )
31
 
32
- # Train
33
  optimizer = torch.optim.Adam(model.parameters(), lr=5e-5)
34
  for epoch in range(2):
35
  optimizer.zero_grad()
@@ -54,7 +53,6 @@ def generate_text(prompt):
54
  except Exception as e:
55
  return f"❌ Error: {str(e)}"
56
 
57
- # Create interface
58
  with gr.Blocks() as demo:
59
  gr.Markdown("# 🇸🇰 Slovak LLM Training")
60
 
 
3
  import torch
4
  from datasets import load_dataset
5
  import spaces
6
+ from huggingface-hub import login
7
+
8
+ login(token=hf_token)
9
 
 
10
  try:
11
  model = AutoModelForCausalLM.from_pretrained("flamiry/first")
12
  tokenizer = AutoTokenizer.from_pretrained("flamiry/first")
 
18
  @spaces.GPU
19
  def train_model():
20
  try:
 
21
  dataset = load_dataset("DGurgurov/slovak_sa", split="train")
22
  slovak_texts = list(dataset['text'])[:50]
23
 
 
24
  inputs = tokenizer(
25
  slovak_texts,
26
  return_tensors="pt",
 
29
  max_length=64
30
  )
31
 
 
32
  optimizer = torch.optim.Adam(model.parameters(), lr=5e-5)
33
  for epoch in range(2):
34
  optimizer.zero_grad()
 
53
  except Exception as e:
54
  return f"❌ Error: {str(e)}"
55
 
 
56
  with gr.Blocks() as demo:
57
  gr.Markdown("# 🇸🇰 Slovak LLM Training")
58