@@ -15,6 +15,24 @@ from torch.nn import Parameter
@Model.register("basic_bilstm_classifier")
class BiLstmClassifier(Model):
    """
    Two things to note first:

    - This BiLstmClassifier is a subclass of AllenNLP's Model class.
    - This class registers the type "basic_bilstm_classifier" using the @Model.register() decorator,
      which is required for the config file to identify the Model class.

    An AllenNLP Model is similar to a PyTorch Module: it implements a forward() method and returns
    an output dictionary with the loss, logits, and more.

    The constructor parameters should match the configuration in the config file; the Vocabulary is
    built by the library/train pipeline after reading the data with the DatasetReader.

    In this model, we use ELMo embeddings, a 1-layer BiLSTM (the encoder), and 2 feed-forward layers.
    The train command/pipeline calls the forward method on a batch of Instances, and the forward
    method returns the output dictionary with the loss, logits, label, and F1 metrics.
    """

    def __init__(self, vocab: Vocabulary,
                 text_field_embedder: TextFieldEmbedder,
                 encoder: Seq2SeqEncoder,
@@ -32,6 +50,7 @@ class BiLstmClassifier(Model):
        self.label_f1_metrics = {}

        # create F1 Measures for each class
        for i in range(self.num_classes):
            self.label_f1_metrics[vocab.get_token_from_index(index=i, namespace="labels")] = \
                F1Measure(positive_label=i)
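
        # Illustrative only: with a two-label vocabulary this produces something like
        #   {"positive": F1Measure(positive_label=0), "negative": F1Measure(positive_label=1)}
        # (the label names here are assumptions).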
@@ -44,7 +63,17 @@ class BiLstmClassifier(Model):
    def forward(self, tokens: Dict[str, torch.LongTensor],
                label: torch.LongTensor) -> Dict[str, torch.LongTensor]:
"""
|
|
|
|
|
The training loop takes a batch of Instances and passes it to the forward method
|
|
|
|
|
|
|
|
|
|
:param tokens: tokens from the Instance
|
|
|
|
|
:param label: label from the data Instance
|
|
|
|
|
|
|
|
|
|
:return: returns an output dictionary after forwarding inputs to the model
|
|
|
|
|
"""
        input_elmo = None
        # pop the "elmo" key and add it back later
        elmo_tokens = tokens.pop("elmo", None)

        embedded_text = self.text_field_embedder(tokens)
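        # note (editorial): embedded_text has shape (batch_size, num_tokens, embedding_dim),
        # per the standard TextFieldEmbedder contract.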
@@ -56,6 +85,7 @@ class BiLstmClassifier(Model):
        # Create ELMo embeddings if applicable
        if self.elmo:
            if elmo_tokens is not None:
                # get ELMo representations from the tokens
                elmo_representations = self.elmo(elmo_tokens["elmo_tokens"])["elmo_representations"]
                if self.use_elmo:
                    input_elmo = elmo_representations.pop()
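                    # note: "elmo_representations" is a list of tensors (one per requested
                    # representation); pop() above takes the last entry.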
@@ -69,6 +99,7 @@ class BiLstmClassifier(Model):
            else:
                embedded_text = input_elmo

        # pass the embedded text to the LSTM encoder
        encoded_text = self.encoder(embedded_text, text_mask)
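        # note (editorial): a Seq2SeqEncoder returns one vector per token, shape
        # (batch_size, num_tokens, encoder_output_dim); the attention step below
        # presumably pools these into a single vector per sequence.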

        # Attention
@@ -77,10 +108,13 @@ class BiLstmClassifier(Model):
        output_dict = {}
        if label is not None:
            logits = self.classifier_feed_forward(encoded_text)

            # Probabilities from Softmax
            class_probabilities = torch.nn.functional.softmax(logits, dim=1)

            output_dict["logits"] = logits

            # loss calculation
            loss = self.loss(logits, label)
            output_dict["loss"] = loss
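
            # note (editorial): class_probabilities is computed here, but the
            # human-readable probabilities are recomputed from the logits in
            # make_output_human_readable() below.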
@@ -96,19 +130,44 @@ class BiLstmClassifier(Model):

    @overrides
    def make_output_human_readable(self, output_dict: Dict[str, torch.Tensor]) -> Dict[str, torch.Tensor]:
"""
|
|
|
|
|
|
|
|
|
|
The predict command/pipeline calls this method with the output dictionary from forward() method.
|
|
|
|
|
|
|
|
|
|
The returned output dictionary will also be printed in the console when the predict command is executed
|
|
|
|
|
|
|
|
|
|
:param output_dict: output dictionary
|
|
|
|
|
:return: returns human readable output dictionary
|
|
|
|
|
"""
|
|
|
|
|
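        # Illustrative only: for a 2-class model, the printed prediction might look like
        #   {"probabilities": [[0.91, 0.09]], "prediction": ["positive"], ...}
        # (label names and values are invented for illustration).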
        class_probabilities = torch.nn.functional.softmax(output_dict['logits'], dim=-1)
        predictions = class_probabilities.cpu().data.numpy()
        argmax_indices = np.argmax(predictions, axis=-1)

        # get the labels from the vocabulary
        label = [self.vocab.get_token_from_index(x, namespace="labels")
                 for x in argmax_indices]
        output_dict['probabilities'] = class_probabilities
        output_dict['positive_label'] = label
        output_dict['prediction'] = label

        # return the output dictionary
        return output_dict

    @overrides
    def get_metrics(self, reset: bool = False) -> Dict[str, float]:
"""
|
|
|
|
|
|
|
|
|
|
This method gets a call from the train pipeline,
|
|
|
|
|
and the returned metrics dictionary will be printed in the Console while Training.
|
|
|
|
|
|
|
|
|
|
The returned metrics dictionary contains class-wise F1 Scores, Average F1 score and loss
|
|
|
|
|
|
|
|
|
|
:param reset: boolean
|
|
|
|
|
|
|
|
|
|
:return: returns a metrics dictionary with Class Level F1 scores and losses
|
|
|
|
|
"""
|
|
|
|
|
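        # Illustrative only: the returned dictionary might look like
        #   {"positive_F1": 0.81, "negative_F1": 0.78, "average_F1": 0.795, "loss": 0.42}
        # (key names and values are assumptions based on the docstring above).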
        metric_dict = {}

        sum_f1 = 0.0