resources.wrappers.FileJsonPyTorch.gate-lf-pytorch-json.gatelfpytorchjson.ngrammodule.py
A GATE plugin that provides many different machine learning
algorithms for a wide range of NLP tasks such as
text classification, tagging, or chunking.
import torch
import sys
import logging
from gatelfpytorchjson.LayerCNN import LayerCNN
logger = logging.getLogger(__name__)
logger.setLevel(logging.INFO)
streamhandler = logging.StreamHandler(stream=sys.stderr)
formatter = logging.Formatter(
'%(asctime)s %(name)-12s %(levelname)-8s %(message)s')
streamhandler.setFormatter(formatter)
logger.addHandler(streamhandler)
class NgramModule(torch.nn.Module):
    def __init__(self, embeddingsmodule, config=None):
        """Create a module for processing ngram sequences for the given EmbeddingsModule embeddingsmodule.

        The ngram layer is chosen via config["ngram_layer"]; currently "lstm" and "cnn" are
        implemented (eventually this will be one of lstm, gru, conv, mean, sum).
        Config keys used here and in the lstm layer: ngram_layer, dropout, lstm_hidden,
        lstm_bidir, lstm_nlayers; the full config is passed on to LayerCNN for the cnn layer.
        """
        super().__init__()
        # avoid a mutable default argument: use an empty config if none is given
        if config is None:
            config = {}
        self.config = config
        # since we directly assign, this should get registered!
        self.embeddingsmodule = embeddingsmodule
        self.emb_dims = self.embeddingsmodule.emb_dims
        method = config.get("ngram_layer", "cnn")
        if method == "lstm":
            self.forward_method = self.forward_method_lstm
            self.init_method = self.init_method_lstm
        elif method == "cnn":
            self.forward_method = self.forward_method_cnn
            self.init_method = self.init_method_cnn
        else:
            raise Exception("NgramModule: unknown ngram_layer method: {}".format(method))
        # now use the configured init method
        self.init_method()
def init_method_lstm(self):
# TODO: maybe use heuristics to find better values for
# hidden_size
# num_layers
# dropout
# bidirectional
dropout_prob = self.config.get("dropout", 0.4)
hidden_size = self.config.get("lstm_hidden", self.embeddingsmodule.emb_dims)
is_bidir = self.config.get("lstm_bidir", True)
nr_layers = self.config.get("lstm_nlayers", 1)
self.lstm = torch.nn.LSTM(input_size=self.embeddingsmodule.emb_dims,
hidden_size=hidden_size,
num_layers=nr_layers,
dropout=dropout_prob,
bidirectional=is_bidir,
batch_first=True)
        # TODO: create a better lstm initialisation vector here for repeated
        # use during forward, if needed!
if is_bidir:
num_directions = 2
else:
num_directions = 1
        # forward_method_lstm returns the output at the last time step, which has
        # hidden_size * num_directions features (independent of the number of layers)
        self.out_dim = hidden_size * num_directions
logger.info("Created LSTM with out_dim {}".format(self.out_dim))
def init_method_cnn(self):
self.cnn = LayerCNN(self.emb_dims, config=self.config)
self.out_dim = self.cnn.dim_outputs
def forward_method_lstm(self, batchofsequences):
batchsize = len(batchofsequences)
# NOTE: we already expect batchofsequences to be a variable with batch_first zero-padded sequences!
# now run the data through the embeddings, then run the sequences of embeddings through the lstm
# Note: the embeddingsmodule.forward method expects the original batchofsequences, we do not need to convert
# to a tensor and variable here!
tmp1 = self.embeddingsmodule.forward(batchofsequences)
        # TODO: for now we use the default zero vectors for the initial hidden/cell state
        out, (hn, cn) = self.lstm(tmp1)
        # we only use the output at the last time step; note that with right-zero-padded
        # batches this is the output at the padded position, not at each sequence's last token
        # logger.info("out is of shape {}, batchsize={}".format(out.size(), batchsize))
        ret = out[:, -1, :]
        # logger.info("ret is of shape {}".format(ret.size()))
        ret = ret.view(batchsize, -1)
return ret
def forward_method_cnn(self, batchofsequences):
tmp1 = self.embeddingsmodule.forward(batchofsequences)
out = self.cnn(tmp1)
return out
def forward(self, batchofsequences):
# just delegate to the forward method for the method chosen
return self.forward_method(batchofsequences)
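
# A minimal, hedged usage sketch (not part of the original module): it assumes a stand-in
# embeddings module that provides only the two things NgramModule relies on, an `emb_dims`
# attribute and a `forward()` that maps a zero-padded batch of token indices to embedding
# vectors. In the real framework this role is played by the package's EmbeddingsModule;
# the `_ToyEmbeddings` class and all parameter values below are illustrative assumptions.
if __name__ == "__main__":
    class _ToyEmbeddings(torch.nn.Module):
        """Hypothetical stand-in for EmbeddingsModule, used only for this sketch."""
        def __init__(self, vocab_size=100, emb_dims=20):
            super().__init__()
            self.emb_dims = emb_dims
            self.emb = torch.nn.Embedding(vocab_size, emb_dims, padding_idx=0)

        def forward(self, batchofsequences):
            # map a (batch, seqlen) LongTensor of indices to (batch, seqlen, emb_dims)
            return self.emb(batchofsequences)

    toyemb = _ToyEmbeddings()
    # use the lstm layer so the sketch does not depend on the LayerCNN configuration
    module = NgramModule(toyemb, config={"ngram_layer": "lstm", "lstm_hidden": 16,
                                         "lstm_bidir": True, "lstm_nlayers": 1,
                                         "dropout": 0.0})
    # a batch of 3 zero-padded index sequences of length 5
    batch = torch.tensor([[4, 7, 2, 0, 0], [9, 1, 3, 5, 0], [6, 6, 0, 0, 0]], dtype=torch.long)
    out = module(batch)
    logger.info("NgramModule output shape: %s (out_dim=%s)", out.size(), module.out_dim)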