Table of Contents

Shortcuts

Tuner¶

This section highlight the key point when using the built-in grid search algorithm.

The tuner class is used to tweak (or tune) hyper parameters, or PyTorch’s module.

from sentarget import Tuner


# Hyper parameters to tune
params = {'epochs': [150],                              # Number of epochs to try
          'lr': np.arange(0.001, 0.3, 0.01).tolist(),   # Make sure to convert it to a list (for saving after)
          'optimizer': ['torch.metrics.Adam'],
          'criterion': ['torch.nn.CrossEntropyLoss']}

# Parameters affecting the models
params_model = {'hidden_dim': [100, 150, 200, 250],      # Model attribute
                'n_layers': [1, 2, 3],                   # Model attribute
                'bidirectional': [False, True],          # Model attribute
                'LSTM.dropout': [0.2, 0.3, 0.4, 0.6],    # Modify all LSTM dropout
                # some other inner parameters, depending on your models...
                }

# Default parameters that will be used to initialize the criterion and optimizer
params_loss = {'ignore_index': PAD_IDX}
params_optim = {}

tuner = Tuner(params, params_loss=params_loss, params_optim=params_optim)

# Run the grid Search
tuner.fit([sentarget.nn.models.gru.BiGRU, sentarget.nn.models.lstm.BiLSTM], train_iterator, eval_iterator)

Grid Search¶

From this class, you can create your own custom grid search function depending on how you preprocess the data:

import torch
from torchtext import data
from torchtext.vocab import Vectors

import sentarget
from sentarget import Tuner
from sentarget.datasets import NoReCfine


def gridsearch(models, params_hyper={}, params_model={}, params_optim={}, params_loss={}):
    """Run the grid search algorithms on the Norwegian NoReCfine dataset provided.

    Args:
        options (dict): general options.
        params_hyper (dict): hyper parameters to tune.
        params_model (dict): model's parameters to tune.
        params_optim (dict): optimizer parameters initialization, won't be tuned.
        params_loss (dict): criterion parameters initialization, won't be tuned.

    """

    # 1/ Load the data
    TEXT = data.Field(lower=False, include_lengths=True, batch_first=True)
    LABEL = data.Field(batch_first=True, unk_token=None)
    FIELDS = [("text", TEXT), ("label", LABEL)]
    train_data, eval_data, test_data = NoReCfine.splits(FIELDS)

    # 2/ Build the vocab
    VOCAB_SIZE = 1_200_000
    VECTORS = Vectors(name='model.txt', url='http://vectors.nlpl.eu/repository/20/58.zip')
    TEXT.build_vocab(train_data, test_data, eval_data,
                     max_size=VOCAB_SIZE,
                     vectors=VECTORS,
                     unk_init=torch.Tensor.normal_)
    LABEL.build_vocab(train_data)

    # 3/ Load iterators
    BATCH_SIZE = params_hyper['batch_size']
    device = torch.device('cpu')
    train_iterator, eval_iterator, test_iterator = data.BucketIterator.splits((train_data, eval_data, test_data),
                                                                              batch_size=BATCH_SIZE,
                                                                              sort_within_batch=True,
                                                                              device=device)

    # ...and initialize the embedding layer
    params_model['embeddings'] = TEXT.vocab.vectors

    # 4/ Initialize the grid search template
    tuner = Tuner(params_hyper, params_model=params_model, params_loss=params_loss, params_optim=params_optim)

    # ...and search !
    tuner.fit(models, train_iterator, eval_iterator, verbose=True, saves=True)
    tuner.save()

And let’s try it out:

# Test these models
models = [sentarget.nn.models.lstm.BiLSTM, sentarget.nn.models.gru.BiGRU]

# Hyper parameters to tune
params_hyper = {
                    # Default parameters
                    'epochs':                    [50, 100],
                    'batch_size':                [64, 128],
                    'lr':                        [0.01, 0.05, 0.1, 0.2],
                    'vectors_name':              'model.txt',
                    'vectors_url':               'http://vectors.nlpl.eu/repository/20/58.zip',
                    'use_pretrained_embeddings': True,
                    'optimizer':                 [torch.optim.Adam],
                    'criterion':                 [torch.nn.CrossEntropyLoss]
                }

# Parameters affecting the model
params_model = {'input_dim':             [len(TEXT.vocab)],     # Should not be modified
                'embedding_dim':         [100],                 # Should not be modified
                'hidden_dim':            [100, 150, 200],
                'output_dim':            [len(LABEL.vocab)],    # Should not be modified
                'n_layers':              [2, 3],
                'bidirectional':         [True, False],
                'dropout':               [0.1, 0.2, 0.3, 0.4],
                'pad_idx_text':          [PAD_IDX_TEXT],        # Should not be modified
                'pad_idx_label':         [PAD_IDX_LABEL],       # Should not be modified
                'unk_idx_text':          [UNK_IDX_TEXT],        # Should not be modified
                'embeddings':            [EMBEDDINGS]}          # Should not be modified

# Parameters used to initialize the loss and optimizer
params_loss = {'ignore_index': PAD_IDX_LABEL}
params_optim = {}

# Run the grid search
gridsearch(models,
           params_hyper = params_hyper,
           params_model = params_model,
           params_loss = params_loss,
           params_optim = params_optim)

Docs

Access comprehensive developer documentation for PyTorch

View Docs

Tutorials

Get in-depth tutorials for beginners and advanced developers

View Tutorials

Resources

Check the GitHub page and contribute to the project

View GitHub