# Viewer metadata (not part of the configuration): file size 3,770 bytes; revision c27cd1b.
# The line-number gutter (1-180) emitted by the file viewer has been dropped.
# Model section: identity of the model, backbone/head settings, tokenizer
# settings, and Hugging Face Hub upload options.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped (the flat form had duplicate `model`, `name`, `enabled`, and
# `tags` keys). Confirm the hierarchy against the consuming code's schema.
model:
  name: sentiment_classifier
  type: classification

  # Backbone and classification-head settings.
  model:
    pretrained_model: xlm-roberta-base
    # Three labels are listed below, matching num_labels.
    num_labels: 3
    dropout: 0.1
    hidden_size: 768
    labels:
      - negative
      - neutral
      - positive
    # null: no explicit per-class weights are configured here.
    class_weights: null

  # Tokenizer call options; every input is padded/truncated to max_length.
  tokenizer:
    max_length: 256
    padding: max_length
    truncation: true
    add_special_tokens: true

  # Upload settings for the Hugging Face Hub.
  huggingface_hub:
    enabled: true
    repo_id: anpmts/sentiment-classifier
    private: false
    create_model_card: true
    commit_message: Upload sentiment classifier model
    # Metadata written into the generated model card.
    model_card:
      language: multilingual
      license: apache-2.0
      tags:
        - sentiment-analysis
        - text-classification
        - xlm-roberta
        - sequence-classification
      datasets: null
# Training section: loop hyper-parameters plus distributed, precision,
# performance, optimizer, scheduler, early-stopping, checkpoint, evaluation,
# and dataloader settings.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped (the flat form had duplicate `enabled`, `type`, `monitor`,
# and `mode` keys). Confirm the hierarchy against the consuming code's schema.
training:
  epochs: 10
  batch_size: 128
  gradient_accumulation_steps: 1
  max_grad_norm: 1.0

  distributed:
    enabled: true
    backend: nccl
    find_unused_parameters: true

  precision:
    mode: bf16

  performance:
    torch_compile: false
    # compile_mode is presumably only read when torch_compile is true - verify.
    compile_mode: reduce-overhead
    cudnn_benchmark: true
    gradient_checkpointing: false
    tf32: true
    flash_attention_2: false
    matmul_precision: high
    channels_last: false

  optimizer:
    type: adamw
    lr: 2.0e-05
    weight_decay: 0.01
    eps: 1.0e-08
    betas:
      - 0.9
      - 0.999
    fused: false

  scheduler:
    type: cosine
    warmup_ratio: 0.1
    # null here; presumably warmup_ratio is used instead - verify in the consumer.
    warmup_steps: null
    num_cycles: 0.5

  # Monitors the same metric and direction as the checkpoint section below.
  early_stopping:
    enabled: true
    patience: 3
    min_delta: 0.001
    monitor: val_loss
    mode: min

  checkpoint:
    save_top_k: 2
    monitor: val_loss
    mode: min
    save_last: true
    every_n_epochs: 1
    resume_from_checkpoint: true
    pretrained_checkpoint: null
    load_only_model: true

  eval:
    eval_every_n_steps: null
    eval_accumulation_steps: 1

  dataloader:
    num_workers: 0
    pin_memory: true
    persistent_workers: false
    prefetch_factor: null

  # NOTE(review): these two keys follow the dataloader keys in the flattened
  # copy; they are placed at the training level here - confirm. `benchmark`
  # may overlap with performance.cudnn_benchmark above.
  deterministic: false
  benchmark: true
# Data section: source selection, per-source settings, splitting, filtering,
# balancing, augmentation, preprocessing, caching, and validation options.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped (the flat form had duplicate `enabled`, `train`, `val`,
# `test`, `text`, `sampling_strategy`, `data_dir`, and `seed` keys). Confirm
# the hierarchy against the consuming code's schema.
data:
  # Names one of the source sub-sections below (`local` is selected).
  data_source: local

  chunked:
    enabled: false
    train_path: data/amazon_reviews/train
    val_path: data/amazon_reviews/validation
    test_path: data/amazon_reviews/test
    chunk_size: 100000
    total_train_samples: 3600000
    # NOTE(review): text_field/label_field directly follow the chunked keys in
    # the flattened copy; they may instead belong one level up under `data`.
    text_field: text
    label_field: sentiment_label

  huggingface:
    repo: anpmts/trustshop
    split_mapping:
      train: train
      val: validation
      test: test
    field_mapping:
      text: text
      sentiment_label: sentiment_label
      sentiment_score: sentiment_score
      quality_label: quality
    config_name: null
    revision: null
    max_samples: null

  local:
    data_dir: data/amazon_reviews
    processed_dir: data/processed/amazon_reviews

  # Split fractions sum to 1.0.
  split:
    train: 0.7
    val: 0.15
    test: 0.15
    stratify: true

  filter_quality:
    enabled: false
    keep_labels:
      - valid

  class_balancing:
    enabled: false
    # `oversample` is selected; both strategy sub-sections are kept below.
    strategy: oversample
    oversample:
      sampling_strategy: auto
    smote:
      k_neighbors: 5
      sampling_strategy: auto

  augmentation:
    enabled: false
    techniques:
      - synonym_replacement
      - random_deletion
      - random_swap
    augment_ratio: 0.1

  preprocessing:
    lowercase: false
    remove_urls: true
    remove_email: true
    remove_special_chars: false
    min_text_length: 10

  cache:
    enabled: true
    cache_dir: data/.cache/amazon_reviews

  # NOTE(review): placed at the data level; confirm it is not a cache option.
  seed: 42

  validation:
    check_missing_fields: false
    check_empty_text: true
    log_invalid_samples: true
# Project-wide settings: run identity, global seed, and target device.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped; in the flat form `name` and `seed` collided with same-named
# keys in other sections.
project:
  name: ts-train
  seed: 42
  device: cuda
  # NOTE(review): training.precision.mode (bf16) is configured separately;
  # confirm how the two settings interact in the consumer.
  mixed_precision: true
# Filesystem locations; all values are relative paths.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped; in the flat form `data_dir` collided with the same-named key
# in the data section.
paths:
  data_dir: data
  data_file: data/output.jsonl
  output_dir: outputs
  model_dir: models
  log_dir: logs
# Experiment-tracking and logging switches (Weights & Biases and TensorBoard
# are both enabled).
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped; confirm the hierarchy against the consuming code's schema.
logging:
  use_wandb: true
  wandb_project: ts-absa-classification
  # null: no explicit W&B entity is configured here.
  wandb_entity: null
  use_tensorboard: true
  # Unit (steps vs. batches) is not shown here - TODO confirm.
  log_interval: 10
# Per-run experiment metadata; every field is left empty in this file.
# NOTE(review): nesting was reconstructed from a copy whose indentation had
# been stripped; in the flat form `name` and `tags` collided with same-named
# keys in other sections. A stray trailing `|` left by the file viewer was
# removed because it is not valid YAML after `notes`.
experiment:
  name: null
  tags: []
  notes: ''