configs/multi_turn/mag_bert_MIntRec2.py

class Param():
    
    def __init__(self, args):
        
        self.hyper_param = self._get_hyper_parameters(args)
        
    def _get_hyper_parameters(self, args):
        """
        Args:
            num_train_epochs (int): The number of training epochs.
            num_labels (autofill): The output dimension.
            max_seq_length (autofill): The maximum total input sequence length after tokenization. Sequences longer than this will be truncated, sequences shorter will be padded.
            freeze_backbone_parameters (binary): Whether to freeze all parameters but the last layer.
            feat_dim (int): The feature dimension.
            warmup_proportion (float): The warmup ratio for learning rate.
            activation (str): The activation function of the hidden layer (support 'relu' and 'tanh').
            train_batch_size (int): The batch size for training.
            eval_batch_size (int): The batch size for evaluation. 
            test_batch_size (int): The batch size for testing.
            wait_patient (int): Patient steps for Early Stop.
        """

        if args.text_backbone.startswith('bert'):

            hyper_parameters = {
                'need_aligned': True,
                'eval_monitor': ['acc'],
                'train_batch_size': [2],
                'select_bs': [16],
                'eval_batch_size': 2,
                'test_batch_size': 2,
                'wait_patience': [3],
                'num_train_epochs': [40],
                'context_len': [0.5],  
                'beta_shift': [0.05],
                'dropout_prob': [0.05],
                'warmup_proportion': [0.01],
                'lr': [4e-6],
                'aligned_method': ['conv1d'],   
                'weight_decay': [0.1], 
                'scale': [1],
                'alpha' : [1],
                'beta' : [0.1]
            } 
        else:
            raise ValueError('Not supported text backbone')        
        
        return hyper_parameters