@@ -69,16 +69,31 @@ def forward(self, input, hx):
         )
         return func(input, self.all_weights, hx)
 
+    def __repr__(self):
+        s = '{name}({input_size}, {hidden_size}'
+        if self.num_layers != 1:
+            s += ', num_layers={num_layers}'
+        if self.bias is not True:
+            s += ', bias={bias}'
+        if self.batch_first is not False:
+            s += ', batch_first={batch_first}'
+        if self.dropout != 0:
+            s += ', dropout={dropout}'
+        if self.bidirectional is not False:
+            s += ', bidirectional={bidirectional}'
+        s += ')'
+        return s.format(name=self.__class__.__name__, **self.__dict__)
+
 
 class RNN(RNNBase):
     r"""Applies a multi-layer Elman RNN with tanh or ReLU non-linearity to an input sequence.
 
 
     For each element in the input sequence, each layer computes the following
     function:
-
+
     .. math::
-
+
         h_t = \tanh(w_{ih} * x_t + b_{ih} + w_{hh} * h_{(t-1)} + b_{hh})
 
     where :math:`h_t` is the hidden state at time `t`, and :math:`x_t` is the hidden
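
The new RNNBase.__repr__ above only appends constructor arguments that differ from their defaults. A minimal sketch of the expected output (hypothetical usage, assuming torch.nn is importable with this patch applied):

import torch.nn as nn

# defaults suppressed: only input_size and hidden_size are printed
print(nn.RNN(10, 20))
# RNN(10, 20)

# non-default arguments are appended in the order of the checks above
print(nn.RNN(10, 20, num_layers=2, dropout=0.5, bidirectional=True))
# RNN(10, 20, num_layers=2, dropout=0.5, bidirectional=True)
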
@@ -104,9 +119,9 @@ class RNN(RNNBase):
         - `h_n`: A (num_layers x batch x hidden_size) tensor containing the hidden state for k=seq_len
 
     Attributes:
-        weight_ih_l[k]: the learnable input-hidden weights of the k-th layer,
+        weight_ih_l[k]: the learnable input-hidden weights of the k-th layer,
             of shape `(input_size x hidden_size)`
-        weight_hh_l[k]: the learnable hidden-hidden weights of the k-th layer,
+        weight_hh_l[k]: the learnable hidden-hidden weights of the k-th layer,
             of shape `(hidden_size x hidden_size)`
         bias_ih_l[k]: the learnable input-hidden bias of the k-th layer, of shape `(hidden_size)`
         bias_hh_l[k]: the learnable hidden-hidden bias of the k-th layer, of shape `(hidden_size)`
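
The per-layer parameters documented above are exposed as module attributes named by layer index. A hypothetical access sketch (attribute names taken from the docstring; shapes omitted here):

import torch.nn as nn

rnn = nn.RNN(input_size=10, hidden_size=20, num_layers=2)
w_ih0 = rnn.weight_ih_l0   # input-hidden weights of layer 0
w_hh1 = rnn.weight_hh_l1   # hidden-hidden weights of layer 1
b_ih0 = rnn.bias_ih_l0     # input-hidden bias of layer 0
b_hh1 = rnn.bias_hh_l1     # hidden-hidden bias of layer 1
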
@@ -155,7 +170,7 @@ class LSTM(RNNBase):
 
     where :math:`h_t` is the hidden state at time `t`, :math:`c_t` is the cell state at time `t`,
     :math:`x_t` is the hidden state of the previous layer at time `t` or :math:`input_t` for the first layer,
-    and :math:`i_t`, :math:`f_t`, :math:`g_t`, :math:`o_t` are the input, forget,
+    and :math:`i_t`, :math:`f_t`, :math:`g_t`, :math:`o_t` are the input, forget,
     cell, and out gates, respectively.
 
     Args:
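
For reference, the gates named in this hunk follow the standard LSTM formulation (the full .. math:: block sits just above this hunk in the file); in the usual notation:

    i_t = \sigma(W_{ii} x_t + b_{ii} + W_{hi} h_{(t-1)} + b_{hi})
    f_t = \sigma(W_{if} x_t + b_{if} + W_{hf} h_{(t-1)} + b_{hf})
    g_t = \tanh(W_{ig} x_t + b_{ig} + W_{hg} h_{(t-1)} + b_{hg})
    o_t = \sigma(W_{io} x_t + b_{io} + W_{ho} h_{(t-1)} + b_{ho})
    c_t = f_t * c_{(t-1)} + i_t * g_t
    h_t = o_t * \tanh(c_t)
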
@@ -249,7 +264,19 @@ def __init__(self, *args, **kwargs):
         super(GRU, self).__init__('GRU', *args, **kwargs)
 
 
-class RNNCell(Module):
+class RNNCellBase(Module):
+
+    def __repr__(self):
+        s = '{name}({input_size}, {hidden_size}'
+        if 'bias' in self.__dict__ and self.bias != True:
+            s += ', bias={bias}'
+        if 'nonlinearity' in self.__dict__ and self.nonlinearity != "tanh":
+            s += ', nonlinearity={nonlinearity}'
+        s += ')'
+        return s.format(name=self.__class__.__name__, **self.__dict__)
+
+
+class RNNCell(RNNCellBase):
     r"""An Elman RNN cell with tanh or ReLU non-linearity.
 
     .. math::
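
The shared RNNCellBase.__repr__ reports only non-default options of the cell classes below; a hypothetical sketch of the expected output under this patch:

import torch.nn as nn

print(nn.RNNCell(10, 20))                       # RNNCell(10, 20)
print(nn.RNNCell(10, 20, nonlinearity='relu'))  # RNNCell(10, 20, nonlinearity=relu)
print(nn.LSTMCell(10, 20, bias=False))          # LSTMCell(10, 20, bias=False)
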
@@ -325,7 +352,7 @@ def forward(self, input, hx):
         )
 
 
-class LSTMCell(Module):
+class LSTMCell(RNNCellBase):
    r"""A long short-term memory (LSTM) cell.
 
     .. math::
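
Reparenting LSTMCell does not change its forward interface; a minimal single-step usage sketch (Variable wrapping and shapes are illustrative, following the cell API in this file):

import torch
import torch.nn as nn
from torch.autograd import Variable

cell = nn.LSTMCell(10, 20)           # input_size=10, hidden_size=20
x = Variable(torch.randn(3, 10))     # batch of 3 inputs
h0 = Variable(torch.zeros(3, 20))    # initial hidden state
c0 = Variable(torch.zeros(3, 20))    # initial cell state
h1, c1 = cell(x, (h0, c0))           # one time step
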
@@ -399,7 +426,7 @@ def forward(self, input, hx):
         )
 
 
-class GRUCell(Module):
+class GRUCell(RNNCellBase):
     r"""A gated recurrent unit (GRU) cell
     .. math::
 
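
GRUCell picks up the same base class and therefore the same __repr__; a minimal usage sketch (illustrative shapes, following the cell API in this file):

import torch
import torch.nn as nn
from torch.autograd import Variable

cell = nn.GRUCell(10, 20)
x = Variable(torch.randn(3, 10))
h = Variable(torch.zeros(3, 20))
h = cell(x, h)                       # GRU cells carry no separate cell state
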