
Commit

docs update
sidharthms committed Apr 18, 2018
1 parent 4df4e84 commit 584cd22
Showing 28 changed files with 450 additions and 250 deletions.
2 changes: 2 additions & 0 deletions .gitignore
@@ -1,3 +1,5 @@
*.pyc
*.pth
deepmatcher.egg-info/*
examples/.ipynb_checkpoints/*
docs/build
13 changes: 8 additions & 5 deletions deepmatcher/__init__.py
@@ -1,16 +1,19 @@
r"""
The deepmatcher package contains high-level modules used in the construction of deep
learning models for entity matching. It also contains data processing utilities.
"""

from .data import process
from .optim import Optimizer
from .runner import Statistics
from .models import modules
from .models.core import (MatchingModel, AttrSummarizer, AttrComparator,
WordContextualizer, WordComparator, WordAggregator, Classifier)
from .models import (attr_summarizers, word_aggregators, word_comparators,
word_contextualizers)

__all__ = [
attr_summarizers, word_aggregators, word_comparators,
word_contextualizers, process, Optimizer, Statistics, MatchingModel, AttrSummarizer,
AttrComparator, WordContextualizer, WordComparator, WordAggregator, Classifier, modules
attr_summarizers, word_aggregators, word_comparators, word_contextualizers, process,
MatchingModel, AttrSummarizer, AttrComparator, WordContextualizer,
WordComparator, WordAggregator, Classifier, modules
]

_check_nan = True
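For orientation, the names exported in __all__ above cover a typical end-to-end run. The sketch below shows how they are usually combined; the CSV file names, the data path, and the run_train/run_eval method names are illustrative assumptions that do not appear in this diff.

    import deepmatcher as dm

    # Preprocess labeled CSVs into train/validation/test datasets
    # (file names and path are hypothetical placeholders).
    train, validation, test = dm.data.process(
        path='sample_data',
        train='train.csv',
        validation='validation.csv',
        test='test.csv')

    # Build a matching model; 'hybrid' selects dm.attr_summarizers.Hybrid.
    model = dm.MatchingModel(attr_summarizer='hybrid')

    # Train, keeping the best checkpoint, then evaluate on the held-out split.
    model.run_train(train, validation, best_save_path='best_model.pth')
    model.run_eval(test)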
2 changes: 1 addition & 1 deletion deepmatcher/batch.py
@@ -40,7 +40,7 @@ def from_old_metadata(data, old_attrtensor):
return AttrTensor(data, *old_attrtensor[1:])


class Batch(object):
class MatchingBatch(object):

def __init__(self, input, train_dataset):
copy_fields = train_dataset.all_text_fields
1 change: 0 additions & 1 deletion deepmatcher/config.py

This file was deleted.

4 changes: 2 additions & 2 deletions deepmatcher/data/iterator.py
@@ -4,7 +4,7 @@

from torchtext import data

from ..batch import Batch
from ..batch import MatchingBatch

logger = logging.getLogger(__name__)

@@ -44,7 +44,7 @@ def splits(cls, datasets, batch_sizes=None, **kwargs):

def __iter__(self):
for batch in super(MatchingIterator, self).__iter__():
yield Batch(batch, self.train_dataset)
yield MatchingBatch(batch, self.train_dataset)

def create_batches(self):
if self.sort_in_buckets:
40 changes: 0 additions & 40 deletions deepmatcher/loss.py

This file was deleted.

160 changes: 81 additions & 79 deletions deepmatcher/models/attr_summarizers.py
@@ -2,24 +2,28 @@


class SIF(dm.AttrSummarizer):
r"""The attribute summarizer for the SIF (Smooth Inverse Frequency) model.
"""__init__(word_contextualizer=None, word_comparator=None, word_aggregator=None, \
hidden_size=None)
The attribute summarizer for the SIF (Smooth Inverse Frequency) model.
Args:
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The word
contextualizer module (refer to :class:`~dm.WordContextualizer` for details) to
use for attribute summarization. The SIF model does not take word context
information into account, hence this defaults to None.
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use for
attribute summarization. The SIF model does not perform word by word comparisons,
hence this defaults to None.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use for
attribute summarization. This model uses SIF-based weighted average aggregation
over the word embeddings of an input sequence, hence this defaults to 'sif-pool'.
hidden_size (int): The hidden size to use for all 3 attribute summarization
sub-modules (i.e., word contextualizer, word comparator, and word aggregator),
if they are customized. By default, the SIF model does not use this parameter.
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The
word contextualizer module (refer to :class:`~dm.WordContextualizer` for
details) to use for attribute summarization. The SIF model does not take word
context information into account, hence this defaults to None.
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use
for attribute summarization. The SIF model does not perform word by word
comparisons, hence this defaults to None.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use
for attribute summarization. This model uses SIF-based weighted average
aggregation over the word embeddings of an input sequence, hence this
defaults to 'sif-pool'.
hidden_size (int): The hidden size to use for all 3 attribute summarization
sub-modules (i.e., word contextualizer, word comparator, and word aggregator),
if they are customized. By default, the SIF model does not use this parameter.
"""

def _init(self,
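To make the SIF defaults above concrete, here is a minimal sketch of selecting this summarizer when building a matching model; the 'sif' string shorthand and the attr_summarizer argument of MatchingModel are assumed from the library's usual conventions and are not part of this hunk.

    import deepmatcher as dm

    # Two equivalent (assumed) ways to pick the SIF attribute summarizer:
    # a string shorthand, or an explicit instance with its documented default
    # aggregator spelled out.
    model = dm.MatchingModel(attr_summarizer='sif')
    model = dm.MatchingModel(
        attr_summarizer=dm.attr_summarizers.SIF(word_aggregator='sif-pool'))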
@@ -39,27 +43,27 @@ class RNN(dm.AttrSummarizer):
r"""The attribute summarizer for the RNN model.
Args:
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The word
contextualizer module (refer to :class:`~dm.WordContextualizer` for details) to
use for attribute summarization. This model uses an RNN to take context
information into account, and the default value is 'gru' (i.e., it uses a
bidirectional GRU as the specific RNN instantiation). Other options are 'rnn'
(the vanilla bi-RNN) and 'lstm' (the bi-LSTM model).
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use for
attribute summarization. The RNN model does not perform word by word comparisons,
hence this defaults to None.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use for
attribute summarization. The RNN model uses a bidirectional RNN and concatenates
the last outputs of the forward and backward RNNs, hence the default value is
'birnn-last-pool'.
hidden_size (int): The hidden size to use for the word contextualizer. This value
will also be used as the hidden size for the other 2 attribute summarization
sub-modules (i.e., word comparator, and word aggregator), if they are customized.
If not specified, the hidden size for each component will be set to be the same as
its input size. E.g. if the word embedding dimension is 300 and hidden_size is
None, the word contextualizer's hidden size will be 300.
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The
word contextualizer module (refer to :class:`~dm.WordContextualizer` for
details) to use for attribute summarization. This model uses an RNN to take
context information into account, and the default value is 'gru' (i.e., it uses
a bidirectional GRU as the specific RNN instantiation). Other options are 'rnn'
(the vanilla bi-RNN) and 'lstm' (the bi-LSTM model).
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use
for attribute summarization. The RNN model does not perform word by word
comparisons, hence this defaults to None.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use
for attribute summarization. The RNN model uses a bidirectional RNN and
concatenates the last outputs of the forward and backward RNNs, hence the
default value is 'birnn-last-pool'.
hidden_size (int): The hidden size to use for the word contextualizer. This value
will also be used as the hidden size for the other 2 attribute summarization
sub-modules (i.e., word comparator, and word aggregator), if they are
customized. If not specified, the hidden size for each component will be set
to be the same as its input size. E.g. if the word embedding dimension is 300
and hidden_size is None, the word contextualizer's hidden size will be 300.
"""

def _init(self,
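As a quick illustration of the parameters documented above, the sketch below swaps the default 'gru' contextualizer for 'lstm' and fixes the hidden size; the attr_summarizer argument of MatchingModel is again an assumption, not something shown in this hunk.

    import deepmatcher as dm

    # RNN summarizer with a bi-LSTM contextualizer instead of the default bi-GRU,
    # and an explicit hidden size shared by any customized sub-modules.
    rnn_summarizer = dm.attr_summarizers.RNN(
        word_contextualizer='lstm',
        hidden_size=300)
    model = dm.MatchingModel(attr_summarizer=rnn_summarizer)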
@@ -77,31 +81,30 @@ def _init(self,


class Attention(dm.AttrSummarizer):

r"""The attribute summarizer for the attention-based model.
Args:
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The word
contextualizer module (refer to :class:`~dm.WordContextualizer` for details) to
use for attribute summarization. The attention model does not take word context
information into account, hence this defaults to None.
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use for
attribute summarization. The attention model performs word by word comparison with
the decomposable attention mechanism, hence this defaults to
'decomposable-attention'.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use for
attribute summarization. The Attention model performs the aggregation by summing
over the comparison results from the word comparator, divided by the length of
the input sequence (to get constant variance through the network flow). Hence
this defaults to 'divsqrt-pool'.
hidden_size (int): The hidden size to use for the word comparator. This value
will also be used as the hidden size for the other 2 attribute summarization
sub-modules (i.e., word contextualizer, and word aggregator), if they are customized.
If not specified, the hidden size for each component will be set to be the same as
its input size. E.g. if the word embedding dimension is 300 and hidden_size is
None, the word contextualizer's hidden size will be 300.
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The
word contextualizer module (refer to :class:`~dm.WordContextualizer` for
details) to use for attribute summarization. The attention model does not take
word context information into account, hence this defaults to None.
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use
for attribute summarization. The attention model performs word by word
comparison with the decomposable attention mechanism, hence this defaults to
'decomposable-attention'.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use
for attribute summarization. The Attention model performs the aggregation by
summing over the comparison results from the word comparator, divided by the
length of the input sequence (to get constant variance through the network
flow). Hence this defaults to 'divsqrt-pool'.
hidden_size (int): The hidden size to use for the word comparator. This value
will also be used as the hidden size for the other 2 attribute summarization
sub-modules (i.e., word contextualizer, and word aggregator), if they are
customized. If not specified, the hidden size for each component will be set
to be the same as its input size. E.g. if the word embedding dimension is 300
and hidden_size is None, the word contextualizer's hidden size will be 300.
"""

def _init(self,
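Following the same pattern, here is a hedged sketch of the Attention summarizer with its documented defaults written out explicitly; only the parameter names and default strings quoted in the docstring come from this diff, the rest is assumed.

    import deepmatcher as dm

    # Attention summarizer: decomposable-attention word comparison and
    # 'divsqrt-pool' aggregation, stated explicitly rather than left implicit.
    attention_summarizer = dm.attr_summarizers.Attention(
        word_comparator='decomposable-attention',
        word_aggregator='divsqrt-pool')
    model = dm.MatchingModel(attr_summarizer=attention_summarizer)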
@@ -119,29 +122,28 @@ def _init(self,


class Hybrid(dm.AttrSummarizer):

r"""The attribute summarizer for the hybrid model.
Args:
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The word
contextualizer module (refer to :class:`~dm.WordContextualizer` for details) to
use for attribute summarization. The hybrid model uses a bidirectional GRU (a
specific type of RNN) to take context information into account. The default
value is 'gru'.
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use for
attribute summarization. The hybrid model performs word by word comparison over
the raw input word embeddings (rather than the RNN hidden states), hence this
defaults to an Attention object with 'decomposable' as the attention mechanism
on the raw input embeddings.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use for
attribute summarization. A second layer of attention is used for the
aggregation. Please consult the paper for more information. The default value is
'concat-attention-with-rnn'.
hidden_size (int): The hidden size to use for all 3 attribute summarization
sub-modules (i.e., word contextualizer, word comparator, and word aggregator),
if they are customized.
word_contextualizer (string or :class:`~dm.WordContextualizer` or callable): The
word contextualizer module (refer to :class:`~dm.WordContextualizer` for
details) to use for attribute summarization. The hybrid model uses a
bidirectional GRU (a specific type of RNN) to take context information into
account. The default value is 'gru'.
word_comparator (string or :class:`~dm.WordComparator` or callable): The word
comparator module (refer to :class:`~dm.WordComparator` for details) to use
for attribute summarization. The hybrid model performs word by word comparison
over the raw input word embeddings (rather than the RNN hidden states), hence
this defaults to an Attention object with 'decomposable' as the attention
mechanism on the raw input embeddings.
word_aggregator (string or :class:`~dm.WordAggregator` or callable): The word
aggregator module (refer to :class:`~dm.WordAggregator` for details) to use
for attribute summarization. A second layer of attention is used for the
aggregation. Please consult the paper for more information. The default value
is 'concat-attention-with-rnn'.
hidden_size (int): The hidden size to use for all 3 attribute summarization
sub-modules (i.e., word contextualizer, word comparator, and word aggregator),
if they are customized.
"""

def _init(self,
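To round out the four summarizers, here is a sketch of the Hybrid model with its documented defaults made explicit; the word comparator is left at its default since the docstring describes it as an Attention object rather than a plain string, and as before the MatchingModel usage is assumed rather than shown in this diff.

    import deepmatcher as dm

    # Hybrid summarizer: GRU contextualizer plus attention-based aggregation,
    # matching the defaults described in the docstring above.
    hybrid_summarizer = dm.attr_summarizers.Hybrid(
        word_contextualizer='gru',
        word_aggregator='concat-attention-with-rnn')
    model = dm.MatchingModel(attr_summarizer=hybrid_summarizer)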
