File size: 3,770 Bytes
c27cd1b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
# Model section: classifier identity, backbone settings, label set, tokenizer
# options, and Hugging Face Hub upload settings.
model:
  name: sentiment_classifier
  type: classification
  # NOTE(review): a `model` key nested directly under the top-level `model` key.
  # Looks like the result of config composition; confirm the consumer really
  # reads `model.model.*` before flattening or renaming.
  model:
    pretrained_model: xlm-roberta-base
    # Agrees with the three entries listed under `labels` below.
    num_labels: 3
    dropout: 0.1
    # NOTE(review): presumably the encoder's hidden width; confirm it matches
    # the `pretrained_model` checkpoint.
    hidden_size: 768
  # Three class names, matching `num_labels: 3`.
  # NOTE(review): presumably list position defines the class index; verify
  # against the label encoding used by the data pipeline.
  labels:
  - negative
  - neutral
  - positive
  # Explicit null: no per-class weights are configured here.
  class_weights: null
  tokenizer:
    max_length: 256
    # The value is the string `max_length`, not a number.
    # NOTE(review): presumably a padding-strategy name; confirm with the
    # tokenizer call site.
    padding: max_length
    truncation: true
    add_special_tokens: true
  huggingface_hub:
    enabled: true
    repo_id: anpmts/sentiment-classifier
    # NOTE(review): with `enabled: true` and `private: false`, an upload would
    # presumably target a public repo; confirm that is intended.
    private: false
    create_model_card: true
    commit_message: Upload sentiment classifier model
    model_card:
      language: multilingual
      license: apache-2.0
      tags:
      - sentiment-analysis
      - text-classification
      - xlm-roberta
      - sequence-classification
      # Explicit null: no dataset references are listed for the model card.
      datasets: null
# Training section: loop sizes, distributed/precision/performance switches,
# optimizer and scheduler hyperparameters, early stopping, checkpointing,
# evaluation cadence, and dataloader options.
training:
  epochs: 10
  # NOTE(review): SOURCE does not say whether this is per-device or global
  # batch size; confirm, since `distributed.enabled` is true.
  batch_size: 128
  gradient_accumulation_steps: 1
  max_grad_norm: 1.0
  distributed:
    enabled: true
    backend: nccl
    # NOTE(review): if this maps onto DistributedDataParallel's argument of the
    # same name (assumption), it adds a per-step graph traversal; confirm the
    # model actually has unused parameters.
    find_unused_parameters: true
  precision:
    mode: bf16
  performance:
    # `compile_mode` is set even though `torch_compile` is false.
    # NOTE(review): presumably ignored while compilation is off; confirm.
    torch_compile: false
    compile_mode: reduce-overhead
    cudnn_benchmark: true
    gradient_checkpointing: false
    tf32: true
    flash_attention_2: false
    matmul_precision: high
    channels_last: false
  optimizer:
    type: adamw
    lr: 2.0e-05
    weight_decay: 0.01
    eps: 1.0e-08
    # Two-element list.
    # NOTE(review): presumably (beta1, beta2) for the optimizer; confirm.
    betas:
    - 0.9
    - 0.999
    fused: false
  scheduler:
    type: cosine
    # `warmup_ratio` is set while `warmup_steps` is null.
    # NOTE(review): presumably the ratio is used when steps is null; verify the
    # precedence in the scheduler builder.
    warmup_ratio: 0.1
    warmup_steps: null
    num_cycles: 0.5
  early_stopping:
    enabled: true
    patience: 3
    min_delta: 0.001
    # Same metric and direction as `checkpoint.monitor` / `checkpoint.mode`.
    monitor: val_loss
    mode: min
  checkpoint:
    save_top_k: 2
    monitor: val_loss
    mode: min
    save_last: true
    every_n_epochs: 1
  # NOTE(review): `resume_from_checkpoint` and `load_only_model` are both true
  # while `pretrained_checkpoint` is null; how these three interact is not
  # visible here. Confirm against the trainer.
  resume_from_checkpoint: true
  pretrained_checkpoint: null
  load_only_model: true
  eval:
    # Explicit null: no step-based evaluation interval is configured.
    eval_every_n_steps: null
    eval_accumulation_steps: 1
  dataloader:
    # Zero workers, with `persistent_workers: false` and `prefetch_factor: null`.
    # NOTE(review): if these map onto torch.utils.data.DataLoader arguments
    # (assumption), the latter two only apply when `num_workers` > 0.
    num_workers: 0
    pin_memory: true
    persistent_workers: false
    prefetch_factor: null
  deterministic: false
  # A second benchmark flag alongside `performance.cudnn_benchmark` above; both
  # are true.
  # NOTE(review): confirm which one the trainer reads.
  benchmark: true
# Data section: source selection, per-source settings, split ratios, optional
# filtering/balancing/augmentation, text preprocessing, caching, and validation.
data:
  # NOTE(review): presumably selects which of the `chunked` / `huggingface` /
  # `local` sub-sections below is used; confirm with the data loader.
  data_source: local
  chunked:
    # Disabled; the remaining keys in this sub-section are still populated.
    enabled: false
    train_path: data/amazon_reviews/train
    val_path: data/amazon_reviews/validation
    test_path: data/amazon_reviews/test
    chunk_size: 100000
    total_train_samples: 3600000
    text_field: text
    label_field: sentiment_label
  huggingface:
    repo: anpmts/trustshop
    # Maps the keys `train` / `val` / `test` to the names `train` /
    # `validation` / `test`.
    # NOTE(review): presumably internal split name -> dataset split name.
    split_mapping:
      train: train
      val: validation
      test: test
    # All entries are identity mappings except `quality_label: quality`.
    # NOTE(review): mapping direction (internal -> dataset column, or the
    # reverse) is not visible here; confirm.
    field_mapping:
      text: text
      sentiment_label: sentiment_label
      sentiment_score: sentiment_score
      quality_label: quality
    config_name: null
    revision: null
    # Explicit null.
    # NOTE(review): presumably means no sample cap; confirm.
    max_samples: null
  local:
    data_dir: data/amazon_reviews
    processed_dir: data/processed/amazon_reviews
  # The three ratios sum to 1.0 (0.7 + 0.15 + 0.15).
  split:
    train: 0.7
    val: 0.15
    test: 0.15
    stratify: true
  filter_quality:
    # Disabled; `keep_labels` is still populated.
    enabled: false
    keep_labels:
    - valid
  class_balancing:
    # Disabled; `strategy` names `oversample`, and settings are present for
    # both `oversample` and `smote`.
    enabled: false
    strategy: oversample
    oversample:
      sampling_strategy: auto
    smote:
      k_neighbors: 5
      sampling_strategy: auto
  augmentation:
    # Disabled; the technique list and ratio are still populated.
    enabled: false
    techniques:
    - synonym_replacement
    - random_deletion
    - random_swap
    augment_ratio: 0.1
  preprocessing:
    lowercase: false
    remove_urls: true
    remove_email: true
    remove_special_chars: false
    # NOTE(review): unit (characters vs. tokens) is not visible here; confirm.
    min_text_length: 10
  cache:
    enabled: true
    cache_dir: data/.cache/amazon_reviews
  # Same value as `project.seed`.
  # NOTE(review): confirm whether the two seeds are meant to be kept in sync.
  seed: 42
  validation:
    check_missing_fields: false
    check_empty_text: true
    log_invalid_samples: true
# Project section: run-wide name, seed, device, and mixed-precision switch.
project:
  name: ts-train
  # Same value as `data.seed`.
  seed: 42
  device: cuda
  # NOTE(review): `training.precision.mode` is `bf16`; how this boolean relates
  # to that setting is not visible here. Confirm which one takes effect.
  mixed_precision: true
# Paths section: all values are relative paths.
# NOTE(review): the base directory they resolve against is not visible here;
# presumably the working directory.
paths:
  # `data.local.data_dir` points at the `data/amazon_reviews` subdirectory of
  # this directory.
  data_dir: data
  data_file: data/output.jsonl
  output_dir: outputs
  model_dir: models
  log_dir: logs
# Logging section: both Weights & Biases and TensorBoard switches are enabled.
logging:
  use_wandb: true
  # NOTE(review): this project name (`ts-absa-classification`) differs from
  # `project.name` (`ts-train`) and from the sentiment-classifier model name;
  # confirm it is the intended W&B project.
  wandb_project: ts-absa-classification
  # Explicit null: no W&B entity is configured here.
  wandb_entity: null
  use_tensorboard: true
  # NOTE(review): unit (steps vs. batches) is not visible here; confirm.
  log_interval: 10
# Experiment section: per-run metadata, all left at empty values here.
experiment:
  # Explicit null.
  # NOTE(review): presumably a run name is generated elsewhere when unset;
  # confirm.
  name: null
  # Empty list, not null.
  tags: []
  # Empty string, not null.
  notes: ''