prasenjeet099 commited on
Commit
e9bf96f
·
verified ·
1 Parent(s): 5b13714

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +42 -0
app.py ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ from transformers import AutoModelForSequenceClassification, AutoTokenizer, Trainer, TrainingArguments
3
+ from datasets import load_dataset
4
+
5
+ st.title("Custom AI Model Training on Hugging Face Space")
6
+
7
+ dataset_name = st.text_input("Enter Dataset Name (e.g., prasenjeetz/IQ-Dataset)")
8
+ model_name = st.text_input("Enter Pretrained Model Name (e.g., bert-base-uncased)")
9
+
10
+ if st.button("Start Training"):
11
+ with st.spinner("Loading Dataset..."):
12
+ dataset = load_dataset(dataset_name)
13
+
14
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
15
+
16
+ def tokenize_function(examples):
17
+ return tokenizer(examples["text"], padding="max_length", truncation=True)
18
+
19
+ tokenized_datasets = dataset.map(tokenize_function, batched=True)
20
+
21
+ training_args = TrainingArguments(
22
+ output_dir="./results",
23
+ evaluation_strategy="epoch",
24
+ save_strategy="epoch",
25
+ learning_rate=2e-5,
26
+ per_device_train_batch_size=8,
27
+ per_device_eval_batch_size=8,
28
+ num_train_epochs=3,
29
+ weight_decay=0.01,
30
+ )
31
+
32
+ model = AutoModelForSequenceClassification.from_pretrained(model_name, num_labels=2)
33
+
34
+ trainer = Trainer(
35
+ model=model,
36
+ args=training_args,
37
+ train_dataset=tokenized_datasets["train"],
38
+ eval_dataset=tokenized_datasets["test"],
39
+ )
40
+
41
+ trainer.train()
42
+ st.success("Training Complete!")