
Commit dcda27f

Merge pull request #137 from corochann/base_forward_model
[refactor] Introduce BaseForwardModel
2 parents 8a0ff2a + aa783eb commit dcda27f

File tree: 4 files changed, +149 -170 lines changed

chainer_chemistry/models/prediction/__init__.py

Lines changed: 2 additions & 0 deletions

@@ -1,5 +1,7 @@
+from chainer_chemistry.models.prediction import base  # NOQA
 from chainer_chemistry.models.prediction import classifier  # NOQA
 from chainer_chemistry.models.prediction import regressor  # NOQA
 
+from chainer_chemistry.models.prediction.base import BaseForwardModel  # NOQA
 from chainer_chemistry.models.prediction.classifier import Classifier  # NOQA
 from chainer_chemistry.models.prediction.regressor import Regressor  # NOQA
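With this change, `BaseForwardModel` is also exported from the `chainer_chemistry.models.prediction` package namespace. A quick, illustrative sanity check (not part of the commit):

# Both import paths should resolve to the same class after this commit.
from chainer_chemistry.models.prediction import BaseForwardModel
from chainer_chemistry.models.prediction.base import BaseForwardModel as _Base

assert BaseForwardModel is _Base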
chainer_chemistry/models/prediction/base.py

Lines changed: 129 additions & 0 deletions

@@ -0,0 +1,129 @@
+import chainer
+from chainer.dataset.convert import concat_examples
+from chainer import link, cuda
+from chainer.iterators import SerialIterator
+import numpy
+
+
+def _to_tuple(x):
+    if not isinstance(x, tuple):
+        x = (x,)
+    return x
+
+
+def _extract_numpy(x):
+    if isinstance(x, chainer.Variable):
+        x = x.data
+    return cuda.to_cpu(x)
+
+
+class BaseForwardModel(link.Chain):
+
+    """A base model which supports _forward functionality.
+
+    It also supports `device` id management.
+
+    Args:
+        device (int): GPU device id of this model to be used.
+            -1 indicates to use in CPU.
+
+    Attributes:
+        _device (int): Model's current device id.
+
+    """
+
+    def __init__(self):
+        super(BaseForwardModel, self).__init__()
+
+        self.inputs = None
+        self._device = None
+
+    def get_device(self):
+        return self._device
+
+    def initialize(self, device=-1):
+        """Initialization of the model.
+
+        It must be executed **after** the link registration
+        (often done by `with self.init_scope()`) has finished.
+
+        Args:
+            device (int): GPU device id of this model to be used.
+                -1 indicates to use in CPU.
+
+        """
+        self.update_device(device=device)
+
+    def update_device(self, device=-1):
+        if self._device is None or self._device != device:
+            # reset current state
+            self.to_cpu()
+
+            # update the model to specified device id
+            self._device = device
+            if device >= 0:
+                chainer.cuda.get_device_from_id(device).use()
+                self.to_gpu()  # Copy the model to the GPU
+
+    def _forward(self, data, fn, batchsize=16,
+                 converter=concat_examples, retain_inputs=False,
+                 preprocess_fn=None, postprocess_fn=None):
+        """Forward data by iterating with batch
+
+        Args:
+            data: "train_x array" or "chainer dataset"
+            fn (Callable): Main function to forward. Its input argument is
+                either Variable, cupy.ndarray or numpy.ndarray, and it
+                returns Variable.
+            batchsize (int): batch size
+            converter (Callable): convert from `data` to `inputs`
+            retain_inputs (bool): If True, this instance keeps inputs in
+                `self.inputs`.
+            preprocess_fn (Callable): Its input is numpy.ndarray or
+                cupy.ndarray, and it may return either Variable,
+                cupy.ndarray or numpy.ndarray.
+            postprocess_fn (Callable): Its input argument is Variable,
+                but this method may return either Variable, cupy.ndarray or
+                numpy.ndarray.
+
+        Returns (tuple or numpy.ndarray): forward result
+
+        """
+        input_list = None
+        output_list = None
+        it = SerialIterator(data, batch_size=batchsize, repeat=False,
+                            shuffle=False)
+        for batch in it:
+            inputs = converter(batch, self._device)
+            inputs = _to_tuple(inputs)
+
+            if preprocess_fn:
+                inputs = preprocess_fn(*inputs)
+                inputs = _to_tuple(inputs)
+
+            outputs = fn(*inputs)
+            outputs = _to_tuple(outputs)
+
+            # Initialize the accumulator lists on the first batch
+            if retain_inputs:
+                if input_list is None:
+                    input_list = [[] for _ in range(len(inputs))]
+                for j, input in enumerate(inputs):
+                    input_list[j].append(cuda.to_cpu(input))
+            if output_list is None:
+                output_list = [[] for _ in range(len(outputs))]
+
+            if postprocess_fn:
+                outputs = postprocess_fn(*outputs)
+                outputs = _to_tuple(outputs)
+            for j, output in enumerate(outputs):
+                output_list[j].append(_extract_numpy(output))
+
+        if retain_inputs:
+            self.inputs = [
+                numpy.concatenate(in_array) for in_array in input_list]
+
+        result = [numpy.concatenate(output) for output in output_list]
+        if len(result) == 1:
+            return result[0]
+        else:
+            return result
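The sketch below is not part of the commit; it only illustrates how a subclass is expected to wire `initialize` and `_forward` together. The `MyPredictor` class, its single linear layer, and the softmax postprocessing are made-up examples.

import numpy
import chainer
import chainer.functions as F
import chainer.links as L

from chainer_chemistry.models.prediction import BaseForwardModel


class MyPredictor(BaseForwardModel):
    """Hypothetical subclass reusing the batched `_forward` loop."""

    def __init__(self, n_out=2, device=-1):
        super(MyPredictor, self).__init__()
        with self.init_scope():
            self.l1 = L.Linear(None, n_out)
        # As the docstring above requires, call initialize() only after
        # all links have been registered inside init_scope().
        self.initialize(device)

    def __call__(self, x):
        return self.l1(x)

    def predict(self, data, batchsize=16):
        def fn(x):
            # _forward itself does not disable backprop or switch to test
            # mode, so do it in the per-batch function.
            with chainer.no_backprop_mode(), chainer.using_config('train', False):
                return self(x)
        return self._forward(data, fn=fn, batchsize=batchsize,
                             postprocess_fn=F.softmax)


model = MyPredictor(n_out=3, device=-1)
x = numpy.random.rand(100, 8).astype(numpy.float32)
proba = model.predict(x)
print(proba.shape)  # (100, 3) numpy array of class probabilities

Because `_forward` concatenates the per-batch outputs with `numpy.concatenate`, the per-batch function must return arrays with a consistent trailing shape.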

chainer_chemistry/models/prediction/classifier.py

Lines changed: 13 additions & 82 deletions

@@ -4,30 +4,17 @@
 from chainer.dataset.convert import concat_examples
 from chainer.functions.evaluation import accuracy
 from chainer.functions.loss import softmax_cross_entropy
-from chainer import link, cuda
 from chainer import reporter
-from chainer.iterators import SerialIterator
-import numpy
 
-
-def _to_tuple(x):
-    if not isinstance(x, tuple):
-        x = (x,)
-    return x
-
-
-def _extract_numpy(x):
-    if isinstance(x, chainer.Variable):
-        x = x.data
-    return cuda.to_cpu(x)
+from chainer_chemistry.models.prediction.base import BaseForwardModel
 
 
 def _argmax(*args):
     x = args[0]
     return chainer.functions.argmax(x, axis=1)
 
 
-class Classifier(link.Chain):
+class Classifier(BaseForwardModel):
 
     """A simple classifier model.
 
@@ -55,6 +42,15 @@ class Classifier(link.Chain):
         compute_metrics (bool): If ``True``, compute metrics on the forward
            computation. The default value is ``True``.
 
+    .. note::
+        The differences between original `Classifier` class in chainer and
+        chainer chemistry are as follows.
+        1. `predict` and `predict_proba` methods are supported.
+        2. `device` can be managed internally by the `Classifier`
+        3. `accfun` is deprecated, `metrics_fun` is used instead.
+        4. `metrics_fun` can be `dict` which specifies the metrics name as key
+           and function as value.
+
     .. note::
        This link uses :func:`chainer.softmax_cross_entropy` with
        default arguments as a loss function (specified by ``lossfun``),
@@ -111,10 +107,8 @@ def __init__(self, predictor,
         with self.init_scope():
             self.predictor = predictor
 
-        self.device = device
-        if device >= 0:
-            chainer.cuda.get_device_from_id(device).use()
-            self.to_gpu()  # Copy the model to the GPU
+        # `initialize` must be called after `init_scope`.
+        self.initialize(device)
 
     def __call__(self, *args, **kwargs):
         """Computes the loss value for an input and label pair.
@@ -172,69 +166,6 @@ def __call__(self, *args, **kwargs):
         reporter.report(self.metrics, self)
         return self.loss
 
-    def _forward(self, data, fn, batchsize=16,
-                 converter=concat_examples, retain_inputs=False,
-                 preprocess_fn=None, postprocess_fn=None):
    [... remaining 60 deleted lines omitted: identical to the `_forward`
     implementation moved into BaseForwardModel (base.py above), except that
     it read `self.device` instead of `self._device` ...]
 
     def predict_proba(
             self, data, batchsize=16, converter=concat_examples,
             retain_inputs=False, preprocess_fn=None,
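A short usage sketch for the refactored Classifier (illustrative, not from the diff; the dict form of `metrics_fun` follows point 4 of the note above, and the default behaviour of `predict`/`predict_proba` is assumed):

import numpy
import chainer.functions as F
import chainer.links as L

from chainer_chemistry.models.prediction import Classifier

# Any Link producing class scores can serve as the predictor here.
clf = Classifier(L.Linear(None, 3),
                 metrics_fun={'accuracy': F.accuracy},  # dict form, see note 4
                 device=-1)  # device is handled via BaseForwardModel.initialize

x = numpy.random.rand(20, 5).astype(numpy.float32)
proba = clf.predict_proba(x)   # class probabilities, shape (20, 3)
labels = clf.predict(x)        # argmax class ids, shape (20,)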
chainer_chemistry/models/prediction/regressor.py

Lines changed: 5 additions & 88 deletions

@@ -1,29 +1,11 @@
 import chainer
 from chainer.dataset.convert import concat_examples
-from chainer import link, cuda
 from chainer import reporter
-from chainer.iterators import SerialIterator
-import numpy
 
+from chainer_chemistry.models.prediction.base import BaseForwardModel
 
-def _to_tuple(x):
-    if not isinstance(x, tuple):
-        x = (x,)
-    return x
 
-
-def _extract_numpy(x):
-    if isinstance(x, chainer.Variable):
-        x = x.data
-    return cuda.to_cpu(x)
-
-
-def _argmax(*args):
-    x = args[0]
-    return chainer.functions.argmax(x, axis=1)
-
-
-class Regressor(link.Chain):
+class Regressor(BaseForwardModel):
 
     """A simple regressor model.
 
@@ -37,7 +19,7 @@ class Regressor(link.Chain):
         label_key (int or str): Key to specify label variable from arguments.
             When it is ``int``, a variable in positional arguments is used.
             And when it is ``str``, a variable in keyword arguments is used.
-        device (int): GPU device id of this Classifier to be used.
+        device (int): GPU device id of this Regressor to be used.
            -1 indicates to use in CPU.
 
     Attributes:
@@ -80,10 +62,8 @@ def __init__(self, predictor,
         with self.init_scope():
             self.predictor = predictor
 
-        self.device = device
-        if device >= 0:
-            chainer.cuda.get_device_from_id(device).use()
-            self.to_gpu()  # Copy the model to the GPU
+        # `initialize` must be called after `init_scope`.
+        self.initialize(device)
 
     def __call__(self, *args, **kwargs):
         """Computes the loss value for an input and label pair.
@@ -142,69 +122,6 @@ def __call__(self, *args, **kwargs):
         reporter.report(self.metrics, self)
         return self.loss
 
-    def _forward(self, data, fn, batchsize=16,
-                 converter=concat_examples, retain_inputs=False,
-                 preprocess_fn=None, postprocess_fn=None):
    [... remaining 60 deleted lines omitted: identical to the `_forward`
     implementation moved into BaseForwardModel (base.py above), except that
     it read `self.device` instead of `self._device` ...]
 
     def predict(
             self, data, batchsize=16, converter=concat_examples,
             retain_inputs=False, preprocess_fn=None, postprocess_fn=None):
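A corresponding sketch for the refactored Regressor (again illustrative, not from the commit; keyword arguments other than `device` are assumed to keep their defaults):

import numpy
import chainer.links as L

from chainer_chemistry.models.prediction import Regressor

# Toy predictor for a 1-dimensional regression target.
reg = Regressor(L.Linear(None, 1), device=-1)

# Device bookkeeping now lives in BaseForwardModel.
assert reg.get_device() == -1

x = numpy.random.rand(50, 4).astype(numpy.float32)
y_pred = reg.predict(x)  # numpy array of shape (50, 1)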
