# Training configuration for the `sentiment_classifier` model: a 3-label
# classification head on top of `xlm-roberta-base`.
#
# NOTE(review): the block nesting below was reconstructed from a source whose
# indentation had been collapsed. Keys, values and their order are unchanged,
# but verify the nesting against the schema of the code that loads this file.

# Model definition, tokenizer settings and Hugging Face Hub upload options.
model:
  name: sentiment_classifier
  type: classification
  model:
    pretrained_model: xlm-roberta-base
    # num_labels equals the number of entries in `labels` below.
    num_labels: 3
    dropout: 0.1
    hidden_size: 768
    labels:
      - negative
      - neutral
      - positive
    class_weights: null
  tokenizer:
    max_length: 256
    # String value `max_length` (a padding strategy name), not a number.
    padding: max_length
    truncation: true
    add_special_tokens: true
  huggingface_hub:
    enabled: true
    repo_id: anpmts/sentiment-classifier
    private: false
    create_model_card: true
    commit_message: Upload sentiment classifier model
    model_card:
      language: multilingual
      license: apache-2.0
      tags:
        - sentiment-analysis
        - text-classification
        - xlm-roberta
        - sequence-classification
      datasets: null

# Optimisation loop, distributed setup, checkpointing and evaluation cadence.
training:
  epochs: 10
  batch_size: 128
  gradient_accumulation_steps: 1
  max_grad_norm: 1.0
  distributed:
    enabled: true
    backend: nccl
    find_unused_parameters: true
  precision:
    # NOTE(review): `project.mixed_precision` is a second precision switch;
    # confirm which of the two the trainer actually reads.
    mode: bf16
  performance:
    torch_compile: false
    compile_mode: reduce-overhead
    cudnn_benchmark: true
    gradient_checkpointing: false
    tf32: true
    flash_attention_2: false
    matmul_precision: high
    channels_last: false
  optimizer:
    type: adamw
    lr: 2.0e-05
    weight_decay: 0.01
    eps: 1.0e-08
    betas:
      - 0.9
      - 0.999
    fused: false
  scheduler:
    type: cosine
    warmup_ratio: 0.1
    warmup_steps: null
    num_cycles: 0.5
  early_stopping:
    enabled: true
    patience: 3
    min_delta: 0.001
    monitor: val_loss
    mode: min
  checkpoint:
    save_top_k: 2
    monitor: val_loss
    mode: min
    save_last: true
    every_n_epochs: 1
    resume_from_checkpoint: true
    pretrained_checkpoint: null
    load_only_model: true
  eval:
    eval_every_n_steps: null
    eval_accumulation_steps: 1
  dataloader:
    num_workers: 0
    pin_memory: true
    persistent_workers: false
    prefetch_factor: null
  # NOTE(review): placed directly under `training` (not `dataloader`) by
  # inference; `benchmark` presumably overlaps with
  # `performance.cudnn_benchmark` -- confirm.
  deterministic: false
  benchmark: true

# Dataset sources, splitting, balancing, augmentation and preprocessing.
data:
  data_source: local
  chunked:
    enabled: false
    train_path: data/amazon_reviews/train
    val_path: data/amazon_reviews/validation
    test_path: data/amazon_reviews/test
    chunk_size: 100000
    total_train_samples: 3600000
    # NOTE(review): `text_field` / `label_field` are assumed to belong to
    # `chunked`; they could also be direct children of `data` -- confirm.
    text_field: text
    label_field: sentiment_label
  huggingface:
    repo: anpmts/trustshop
    split_mapping:
      train: train
      val: validation
      test: test
    field_mapping:
      text: text
      sentiment_label: sentiment_label
      sentiment_score: sentiment_score
      quality_label: quality
    config_name: null
    revision: null
    max_samples: null
  local:
    data_dir: data/amazon_reviews
    processed_dir: data/processed/amazon_reviews
  # Split fractions sum to 1.0 (0.7 + 0.15 + 0.15).
  # NOTE(review): `split` is assumed to be a child of `data`, not of `local`.
  split:
    train: 0.7
    val: 0.15
    test: 0.15
    stratify: true
  filter_quality:
    enabled: false
    keep_labels:
      - valid
  class_balancing:
    enabled: false
    strategy: oversample
    oversample:
      sampling_strategy: auto
    smote:
      k_neighbors: 5
      sampling_strategy: auto
  augmentation:
    enabled: false
    techniques:
      - synonym_replacement
      - random_deletion
      - random_swap
    augment_ratio: 0.1
  preprocessing:
    lowercase: false
    remove_urls: true
    remove_email: true
    remove_special_chars: false
    min_text_length: 10
  cache:
    enabled: true
    cache_dir: data/.cache/amazon_reviews
  # NOTE(review): a second seed exists at `project.seed` (same value, 42);
  # this one is assumed to sit under `data` rather than `data.cache`.
  seed: 42
  # NOTE(review): assumed to be a child of `data` (sample validation flags).
  validation:
    check_missing_fields: false
    check_empty_text: true
    log_invalid_samples: true

# Project-wide run settings.
project:
  name: ts-train
  seed: 42
  device: cuda
  mixed_precision: true

# Filesystem locations (relative paths).
paths:
  data_dir: data
  data_file: data/output.jsonl
  output_dir: outputs
  model_dir: models
  log_dir: logs

# Experiment tracking backends and logging cadence.
logging:
  use_wandb: true
  wandb_project: ts-absa-classification
  wandb_entity: null
  use_tensorboard: true
  log_interval: 10

# Free-form experiment metadata; empty by default.
experiment:
  name: null
  tags: []
  notes: ''