anpmts
/

sentiment-classifier

sentiment-classifier

Generated from Trainer

Model card Files Files and versions

sentiment-classifier / config.yaml

anpmts's picture

Upload sentiment classifier model

c27cd1b verified 4 months ago

history blame contribute delete

3.77 kB

	model:
	name: sentiment_classifier
	type: classification
	model:
	pretrained_model: xlm-roberta-base
	num_labels: 3
	dropout: 0.1
	hidden_size: 768
	labels:
	- negative
	- neutral
	- positive
	class_weights: null
	tokenizer:
	max_length: 256
	padding: max_length
	truncation: true
	add_special_tokens: true
	huggingface_hub:
	enabled: true
	repo_id: anpmts/sentiment-classifier
	private: false
	create_model_card: true
	commit_message: Upload sentiment classifier model
	model_card:
	language: multilingual
	license: apache-2.0
	tags:
	- sentiment-analysis
	- text-classification
	- xlm-roberta
	- sequence-classification
	datasets: null
	training:
	epochs: 10
	batch_size: 128
	gradient_accumulation_steps: 1
	max_grad_norm: 1.0
	distributed:
	enabled: true
	backend: nccl
	find_unused_parameters: true
	precision:
	mode: bf16
	performance:
	torch_compile: false
	compile_mode: reduce-overhead
	cudnn_benchmark: true
	gradient_checkpointing: false
	tf32: true
	flash_attention_2: false
	matmul_precision: high
	channels_last: false
	optimizer:
	type: adamw
	lr: 2.0e-05
	weight_decay: 0.01
	eps: 1.0e-08
	betas:
	- 0.9
	- 0.999
	fused: false
	scheduler:
	type: cosine
	warmup_ratio: 0.1
	warmup_steps: null
	num_cycles: 0.5
	early_stopping:
	enabled: true
	patience: 3
	min_delta: 0.001
	monitor: val_loss
	mode: min
	checkpoint:
	save_top_k: 2
	monitor: val_loss
	mode: min
	save_last: true
	every_n_epochs: 1
	resume_from_checkpoint: true
	pretrained_checkpoint: null
	load_only_model: true
	eval:
	eval_every_n_steps: null
	eval_accumulation_steps: 1
	dataloader:
	num_workers: 0
	pin_memory: true
	persistent_workers: false
	prefetch_factor: null
	deterministic: false
	benchmark: true
	data:
	data_source: local
	chunked:
	enabled: false
	train_path: data/amazon_reviews/train
	val_path: data/amazon_reviews/validation
	test_path: data/amazon_reviews/test
	chunk_size: 100000
	total_train_samples: 3600000
	text_field: text
	label_field: sentiment_label
	huggingface:
	repo: anpmts/trustshop
	split_mapping:
	train: train
	val: validation
	test: test
	field_mapping:
	text: text
	sentiment_label: sentiment_label
	sentiment_score: sentiment_score
	quality_label: quality
	config_name: null
	revision: null
	max_samples: null
	local:
	data_dir: data/amazon_reviews
	processed_dir: data/processed/amazon_reviews
	split:
	train: 0.7
	val: 0.15
	test: 0.15
	stratify: true
	filter_quality:
	enabled: false
	keep_labels:
	- valid
	class_balancing:
	enabled: false
	strategy: oversample
	oversample:
	sampling_strategy: auto
	smote:
	k_neighbors: 5
	sampling_strategy: auto
	augmentation:
	enabled: false
	techniques:
	- synonym_replacement
	- random_deletion
	- random_swap
	augment_ratio: 0.1
	preprocessing:
	lowercase: false
	remove_urls: true
	remove_email: true
	remove_special_chars: false
	min_text_length: 10
	cache:
	enabled: true
	cache_dir: data/.cache/amazon_reviews
	seed: 42
	validation:
	check_missing_fields: false
	check_empty_text: true
	log_invalid_samples: true
	project:
	name: ts-train
	seed: 42
	device: cuda
	mixed_precision: true
	paths:
	data_dir: data
	data_file: data/output.jsonl
	output_dir: outputs
	model_dir: models
	log_dir: logs
	logging:
	use_wandb: true
	wandb_project: ts-absa-classification
	wandb_entity: null
	use_tensorboard: true
	log_interval: 10
	experiment:
	name: null
	tags: []
	notes: ''