| model: | |
| name: sentiment_classifier | |
| type: classification | |
| model: | |
| pretrained_model: xlm-roberta-base | |
| num_labels: 3 | |
| dropout: 0.1 | |
| hidden_size: 768 | |
| labels: | |
| - negative | |
| - neutral | |
| - positive | |
| class_weights: null | |
| tokenizer: | |
| max_length: 256 | |
| padding: max_length | |
| truncation: true | |
| add_special_tokens: true | |
| huggingface_hub: | |
| enabled: true | |
| repo_id: anpmts/sentiment-classifier | |
| private: false | |
| create_model_card: true | |
| commit_message: Upload sentiment classifier model | |
| model_card: | |
| language: multilingual | |
| license: apache-2.0 | |
| tags: | |
| - sentiment-analysis | |
| - text-classification | |
| - xlm-roberta | |
| - sequence-classification | |
| datasets: null | |
| training: | |
| epochs: 10 | |
| batch_size: 128 | |
| gradient_accumulation_steps: 1 | |
| max_grad_norm: 1.0 | |
| distributed: | |
| enabled: true | |
| backend: nccl | |
| find_unused_parameters: true | |
| precision: | |
| mode: bf16 | |
| performance: | |
| torch_compile: false | |
| compile_mode: reduce-overhead | |
| cudnn_benchmark: true | |
| gradient_checkpointing: false | |
| tf32: true | |
| flash_attention_2: false | |
| matmul_precision: high | |
| channels_last: false | |
| optimizer: | |
| type: adamw | |
| lr: 2.0e-05 | |
| weight_decay: 0.01 | |
| eps: 1.0e-08 | |
| betas: | |
| - 0.9 | |
| - 0.999 | |
| fused: false | |
| scheduler: | |
| type: cosine | |
| warmup_ratio: 0.1 | |
| warmup_steps: null | |
| num_cycles: 0.5 | |
| early_stopping: | |
| enabled: true | |
| patience: 3 | |
| min_delta: 0.001 | |
| monitor: val_loss | |
| mode: min | |
| checkpoint: | |
| save_top_k: 2 | |
| monitor: val_loss | |
| mode: min | |
| save_last: true | |
| every_n_epochs: 1 | |
| resume_from_checkpoint: true | |
| pretrained_checkpoint: null | |
| load_only_model: true | |
| eval: | |
| eval_every_n_steps: null | |
| eval_accumulation_steps: 1 | |
| dataloader: | |
| num_workers: 0 | |
| pin_memory: true | |
| persistent_workers: false | |
| prefetch_factor: null | |
| deterministic: false | |
| benchmark: true | |
| data: | |
| data_source: local | |
| chunked: | |
| enabled: false | |
| train_path: data/amazon_reviews/train | |
| val_path: data/amazon_reviews/validation | |
| test_path: data/amazon_reviews/test | |
| chunk_size: 100000 | |
| total_train_samples: 3600000 | |
| text_field: text | |
| label_field: sentiment_label | |
| huggingface: | |
| repo: anpmts/trustshop | |
| split_mapping: | |
| train: train | |
| val: validation | |
| test: test | |
| field_mapping: | |
| text: text | |
| sentiment_label: sentiment_label | |
| sentiment_score: sentiment_score | |
| quality_label: quality | |
| config_name: null | |
| revision: null | |
| max_samples: null | |
| local: | |
| data_dir: data/amazon_reviews | |
| processed_dir: data/processed/amazon_reviews | |
| split: | |
| train: 0.7 | |
| val: 0.15 | |
| test: 0.15 | |
| stratify: true | |
| filter_quality: | |
| enabled: false | |
| keep_labels: | |
| - valid | |
| class_balancing: | |
| enabled: false | |
| strategy: oversample | |
| oversample: | |
| sampling_strategy: auto | |
| smote: | |
| k_neighbors: 5 | |
| sampling_strategy: auto | |
| augmentation: | |
| enabled: false | |
| techniques: | |
| - synonym_replacement | |
| - random_deletion | |
| - random_swap | |
| augment_ratio: 0.1 | |
| preprocessing: | |
| lowercase: false | |
| remove_urls: true | |
| remove_email: true | |
| remove_special_chars: false | |
| min_text_length: 10 | |
| cache: | |
| enabled: true | |
| cache_dir: data/.cache/amazon_reviews | |
| seed: 42 | |
| validation: | |
| check_missing_fields: false | |
| check_empty_text: true | |
| log_invalid_samples: true | |
| project: | |
| name: ts-train | |
| seed: 42 | |
| device: cuda | |
| mixed_precision: true | |
| paths: | |
| data_dir: data | |
| data_file: data/output.jsonl | |
| output_dir: outputs | |
| model_dir: models | |
| log_dir: logs | |
| logging: | |
| use_wandb: true | |
| wandb_project: ts-absa-classification | |
| wandb_entity: null | |
| use_tensorboard: true | |
| log_interval: 10 | |
| experiment: | |
| name: null | |
| tags: [] | |
| notes: '' | |