flamiry committed on
Commit
ce90d74
·
verified ·
1 Parent(s): f0e05e2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -7
app.py CHANGED
@@ -13,12 +13,11 @@ tokenizer = AutoTokenizer.from_pretrained("flamiry/first")
13
  tokenizer.pad_token = tokenizer.eos_token
14
 
15
  @spaces.GPU
16
- def train_model(start, end):
17
- start = int(start)
18
- end = int(end)
19
  try:
20
- dataset = load_dataset("DGurgurov/slovak_sa", split="train")
21
- slovak_texts = list(dataset['text'])[start:end]
22
 
23
  inputs = tokenizer(
24
  slovak_texts,
@@ -57,8 +56,7 @@ with gr.Blocks() as demo:
57
 
58
  with gr.Tab("Train Model"):
59
  gr.Markdown("Click to train the model on Slovak data")
60
- start_input = gr.Textbox(label="Start")
61
- end_input = gr.Textbox(label="End")
62
  train_btn = gr.Button("Start Training", variant="primary")
63
  train_output = gr.Textbox(label="Result", interactive=False)
64
  train_btn.click(train_model, inputs=[start_input,end_input] ,outputs=train_output)
 
13
  tokenizer.pad_token = tokenizer.eos_token
14
 
15
  @spaces.GPU
16
+ def train_model(number):
17
+ number = int(number)
 
18
  try:
19
+ dataset = load_dataset("allenai/c4", "sk", split="train", streaming=True)
20
+ slovak_texts = list(dataset.take(number))
21
 
22
  inputs = tokenizer(
23
  slovak_texts,
 
56
 
57
  with gr.Tab("Train Model"):
58
  gr.Markdown("Click to train the model on Slovak data")
59
+ number_input = gr.Textbox(label="Kol-vo textov")
 
60
  train_btn = gr.Button("Start Training", variant="primary")
61
  train_output = gr.Textbox(label="Result", interactive=False)
62
  train_btn.click(train_model, inputs=[start_input,end_input] ,outputs=train_output)