yagnik12 committed on
Commit
f124c80
·
verified ·
1 Parent(s): b5d99e6

Update train.py

Browse files
Files changed (1) hide show
  1. train.py +10 -3
train.py CHANGED
@@ -1,6 +1,13 @@
1
  from datasets import load_dataset
2
  from transformers import AutoTokenizer, AutoModelForSequenceClassification, Trainer, TrainingArguments
3
  import evaluate
 
 
 
 
 
 
 
4
 
5
  # 1. Load BiScope dataset
6
  dataset = load_dataset("HanxiGuo/BiScope_Data")
@@ -14,7 +21,7 @@ def preprocess(examples):
14
 
15
  encoded_dataset = dataset.map(preprocess, batched=True)
16
 
17
- # 3. Load model
18
  model = AutoModelForSequenceClassification.from_pretrained(MODEL, num_labels=2)
19
 
20
  # 4. Metrics
@@ -35,8 +42,8 @@ training_args = TrainingArguments(
35
  per_device_eval_batch_size=16,
36
  num_train_epochs=2,
37
  weight_decay=0.01,
38
- push_to_hub=True, # ✅ Upload to HF
39
- hub_model_id="yagnik12/AI_Text_Detecter_HanxiGuo_BiScope-Data"
40
  )
41
 
42
  # 6. Trainer
 
1
  from datasets import load_dataset
2
  from transformers import AutoTokenizer, AutoModelForSequenceClassification, Trainer, TrainingArguments
3
  import evaluate
4
+ from huggingface_hub import login
5
+
6
+ # 🔑 Login to Hugging Face (add HF_TOKEN as a secret in your Space settings)
7
+ import os
8
+ hf_token = os.getenv("HF_TOKEN")
9
+ if hf_token:
10
+     login(hf_token)
11
 
12
  # 1. Load BiScope dataset
13
  dataset = load_dataset("HanxiGuo/BiScope_Data")
 
21
 
22
  encoded_dataset = dataset.map(preprocess, batched=True)
23
 
24
+ # 3. Model
25
  model = AutoModelForSequenceClassification.from_pretrained(MODEL, num_labels=2)
26
 
27
  # 4. Metrics
 
42
  per_device_eval_batch_size=16,
43
  num_train_epochs=2,
44
  weight_decay=0.01,
45
+ push_to_hub=True,
46
+ hub_model_id="yagnik12/biscope-detector"
47
  )
48
 
49
  # 6. Trainer