class Param:

    def __init__(self, args):
        self.hyper_param = self.get_hyper_parameters(args)

    def get_hyper_parameters(self, args):
"""
Args:
bert_model (directory): The path for the pre-trained bert model.
max_seq_length (autofill): The maximum total input sequence length after tokenization. Sequences longer than this will be truncated, sequences shorter will be padded.
num_train_epochs (int): The number of training epochs.
num_pretrain_epochs (int): The number of pre-training epochs.
num_labels (autofill): The output dimension.
freeze_bert_parameters (binary): Whether to freeze all parameters but the last layer.
feat_dim (int): The feature dimension.
warmup_proportion (float): The warmup ratio for learning rate.
lr_pre (float): The learning rate for pre-training the backbone.
lr (float): The learning rate for training the backbone.
loss_fct (str): The loss function for training.
activation (str): The activation function of the hidden layer (support 'relu' and 'tanh').
train_batch_size (int): The batch size for training.
eval_batch_size (int): The batch size for evaluation.
test_batch_size (int): The batch size for testing.
wait_patient (int): Patient steps for Early Stop.
"""
print("==============", args.dataset)
if args.dataset == 'banking':
print("==============banking config")
hyper_parameters = {
'pretrained_bert_model': '/home/sharing/disk1/pretrained_embedding/bert/uncased_L-12_H-768_A-12/',
'max_seq_length': None,
'num_pretrain_epochs': 100,
'num_train_epochs': 100,
'num_labels': None,
'pretrain': True,
'freeze_pretrain_bert_parameters': True,
'freeze_train_bert_parameters': False,
'feat_dim': 768,
'warmup_proportion': 0.1,
'lr_pre': 5e-5,
'lr': 1e-5,
'loss_fct': 'CrossEntropyLoss',
'pretrain_temperature': 0.07,
'train_temperature': 0.05,
're_prob': 0.4,
'activation': 'tanh',
'tol': 0.0005,
'grad_clip': 1.0,
'train_batch_size': 128,
'pretrain_batch_size': 128,
'eval_batch_size': 64,
'test_batch_size': 64,
'wait_patient': 10,
}
elif args.dataset == 'clinc':
print("==============clinc config")
hyper_parameters = {
'pretrained_bert_model': '/home/sharing/disk1/pretrained_embedding/bert/uncased_L-12_H-768_A-12/',
'max_seq_length': None,
'num_pretrain_epochs': 100,
'num_train_epochs': 100,
'num_labels': None,
'pretrain': True,
'freeze_pretrain_bert_parameters': True,
'freeze_train_bert_parameters': False,
'feat_dim': 768,
'warmup_proportion': 0.1,
'lr_pre': 5e-5,
'lr': 1e-5,
'loss_fct': 'CrossEntropyLoss',
'pretrain_temperature': 0.07,
'train_temperature': 0.1,
're_prob': 0.4,
'activation': 'tanh',
'tol': 0.0005,
'grad_clip': 1.0,
'train_batch_size': 128,
'pretrain_batch_size': 128,
'eval_batch_size': 64,
'test_batch_size': 64,
'wait_patient': 10,
}
elif args.dataset == 'stackoverflow':
print("==============stackoverflow config")
hyper_parameters = {
'pretrained_bert_model': '/home/sharing/disk1/pretrained_embedding/bert/uncased_L-12_H-768_A-12/',
'max_seq_length': None,
'num_pretrain_epochs': 100,
'num_train_epochs': 100,
'num_labels': None,
'pretrain': True,
'freeze_pretrain_bert_parameters': True,
'freeze_train_bert_parameters': False,
'feat_dim': 768,
'warmup_proportion': 0.1,
'lr_pre': 5e-5,
'lr': 2e-5,
'loss_fct': 'CrossEntropyLoss',
'pretrain_temperature': 0.07,
'train_temperature': 0.05,
're_prob': 0.4,
                'activation': 'tanh',
                'tol': 0.0005,
                'grad_clip': 1.0,
'train_batch_size': 128,
'pretrain_batch_size': 128,
'eval_batch_size': 64,
'test_batch_size': 64,
'wait_patient': 10,
}
        else:
            raise ValueError(f'Unknown dataset: {args.dataset}')

        return hyper_parameters
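

# --- Usage sketch (illustrative, not part of the original file) ---
# A minimal example of how this config class is typically consumed. The
# `--dataset` flag and the argparse wiring below are assumptions for
# illustration; the actual training entry point may set up args differently.
if __name__ == '__main__':
    import argparse

    parser = argparse.ArgumentParser()
    parser.add_argument('--dataset', type=str, default='banking',
                        choices=['banking', 'clinc', 'stackoverflow'])
    args = parser.parse_args()

    param = Param(args)
    # Fields marked "autofill" in the docstring (max_seq_length, num_labels)
    # are left as None here and are expected to be filled in later, e.g. by
    # the data loader once the dataset statistics are known.
    print(param.hyper_param['lr'], param.hyper_param['train_temperature'])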