python api for image_classification #1123

Closed · wants to merge 6 commits
198 changes: 198 additions & 0 deletions demo/image_classification/api_train.py
@@ -0,0 +1,198 @@
# Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
An example showing how to use the current raw SWIG API to train a CIFAR-10
network.

The current implementation uses raw SWIG, which means API calls are passed
directly to the C++ side of Paddle.

The final user-facing API should be simpler and more carefully designed.
"""
import numpy as np
import paddle.trainer_config_helpers as config_helpers
import py_paddle.swig_paddle as swig_api

import cifar_util

# Some global parameters.
IMAGE_SIZE = 32
DATA_SIZE = 3 * IMAGE_SIZE * IMAGE_SIZE
LABEL_SIZE = 10


def optimizer_config():
"""Configure the optimizer settings."""
config_helpers.optimizers.settings(
batch_size=128,
learning_rate=0.1 / 128.0,
learning_method=config_helpers.optimizers.MomentumOptimizer(0.9),
regularization=config_helpers.optimizers.L2Regularization(0.0005 * 128))
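# Note: the learning rate is divided by the batch size and the L2 decay is
# multiplied by it, presumably because Paddle accumulates gradients over
# the whole batch; the effective per-batch values are then 0.1 and 0.0005.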


def network_config():
"""Configure the neural network: a deliberately small multi-layer
perceptron over raw pixels, meant to exercise the API rather than to
reach good CIFAR-10 accuracy."""
img = config_helpers.layers.data_layer(name='image', size=DATA_SIZE)
lbl = config_helpers.layers.data_layer(name='label', size=LABEL_SIZE)
hidden1 = config_helpers.layers.fc_layer(input=img, size=200)
hidden2 = config_helpers.layers.fc_layer(input=hidden1, size=200)
inference = config_helpers.layers.fc_layer(
input=hidden2,
size=10,
act=config_helpers.activations.SoftmaxActivation())
cost = config_helpers.layers.classification_cost(input=inference, label=lbl)
config_helpers.networks.outputs(cost)


def init_parameter(gradient_machine):
"""Initialize every parameter in the gradient machine with uniform noise."""
assert isinstance(gradient_machine, swig_api.GradientMachine)
for each_param in gradient_machine.getParameters():
assert isinstance(each_param, swig_api.Parameter)
array_size = len(each_param)
array = np.random.uniform(-1.0, 1.0, array_size).astype('float32')
each_param.getBuf(swig_api.PARAMETER_VALUE).copyFromNumpyArray(array)


def main():
swig_api.initPaddle("-use_gpu=false", "-trainer_count=4") # use 4 cpu cores

# Prepare CIFAR-10 data. The file lists and meta file below are produced
# by the demo's data preparation script.
cifar_data = cifar_util.Cifar10Data(
img_size=IMAGE_SIZE,
mean_img_size=IMAGE_SIZE,
num_classes=LABEL_SIZE,
batch_size=128,
train_file_list='data/cifar-out/batches/train.txt',
test_file_list='data/cifar-out/batches/test.txt',
meta='data/cifar-out/batches/batches.meta')

# Get enable_types for the optimizer.
# enable_types = [value, gradient, momentum, etc.]
# Different optimizers (SGD, Adam, ...) require the GradientMachine to
# allocate different parameter buffers.
opt_config_proto = config_helpers.config_parser_utils.parse_optimizer_config(
optimizer_config)
opt_config = swig_api.OptimizationConfig.createFromProto(opt_config_proto)
_temp_optimizer_ = swig_api.ParameterOptimizer.create(opt_config)
enable_types = _temp_optimizer_.getParameterTypes()
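# For example, with MomentumOptimizer the machine must allocate value,
# gradient and momentum buffers for every parameter.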

# Create Simple Gradient Machine.
model_config = config_helpers.config_parser_utils.parse_network_config(
network_config)
gradient_machine = swig_api.GradientMachine.createFromConfigProto(
model_config, swig_api.CREATE_MODE_NORMAL, enable_types)

# This assertion has no runtime effect; it only enables type hints in
# IDEs such as PyCharm.
assert isinstance(gradient_machine, swig_api.GradientMachine)

# Initialize Parameter by numpy.
init_parameter(gradient_machine=gradient_machine)

# Create a local updater. Local means training runs in a single process,
# not on a cluster. For cluster training, this could later be changed to
# createRemoteUpdater.
updater = swig_api.ParameterUpdater.createLocalUpdater(opt_config)
assert isinstance(updater, swig_api.ParameterUpdater)

# Initialize ParameterUpdater.
updater.init(gradient_machine)

# Start the gradient machine.
# The gradient machine must be started before invoking forward/backward,
# for inference as well as for training.
gradient_machine.start()

# Evaluators can report metrics such as the error rate. They are C++ objects.
batch_evaluator = gradient_machine.makeEvaluator()
test_evaluator = gradient_machine.makeEvaluator()

# output_arguments holds the network's forward results. They are not used
# directly here; the object is just passed to gradient_machine.forward.
output_arguments = swig_api.Arguments.createArguments(0)

for pass_id in xrange(3): # we train 3 passes.
updater.startPass()

# train_data() returns a callable BatchPool; calling that pool yields
# shuffled mini-batches, hence the double call below.
for batch_id, data_batch in enumerate(cifar_data.train_data()()):
# data_batch is a list of (image, label) samples.
# For online learning, data_batch could instead be fetched from the network.

# Start updating one batch.
pass_type = updater.startBatch(len(data_batch))

# Start BatchEvaluator.
# batch_evaluator can be used between start/finish.
batch_evaluator.start()

# forwardBackward is a shortcut for forward plus backward. It can be
# faster than invoking forward and backward separately, because the
# GradientMachine may run them asynchronously.
gradient_machine.forwardBackward(
cifar_data.data_converter.convert(data_batch), output_arguments,
pass_type)

for each_param in gradient_machine.getParameters():
updater.update(each_param)

# Get the cost. We use numpy to compute the average cost over this batch.
cost_vec = output_arguments.getSlotValue(0)
cost_vec = cost_vec.copyToNumpyMat()
cost = cost_vec.sum() / len(data_batch)

# Feed the batch results to the evaluator.
gradient_machine.eval(batch_evaluator)

# Print logs.
print 'Pass id', pass_id, 'Batch id', batch_id, 'with cost=', \
cost, batch_evaluator

batch_evaluator.finish()
# Finish the batch:
# * clears the gradients,
# * ensures all parameter values are updated.
updater.finishBatch(cost)

# Testing stage: run the test data set through the current network.
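# apply() switches to the parameter snapshot the updater maintains for
# evaluation (e.g. averaged parameters, when enabled); restore() below
# switches back to the training parameters.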
updater.apply()
test_evaluator.start()
for data_batch in cifar_data.test_data():
# in testing stage, only forward is needed.
gradient_machine.forward(
cifar_data.data_converter.convert(data_batch), output_arguments,
swig_api.PASS_TEST)
gradient_machine.eval(test_evaluator)

# print error rate for test data set
print 'Pass', pass_id, ' test evaluator: ', test_evaluator
test_evaluator.finish()
updater.restore()

# catchUpWith() finishes any lazily-applied updates (e.g. regularization)
# so the parameter values read below are up to date.
updater.catchUpWith()
params = gradient_machine.getParameters()
for each_param in params:
assert isinstance(each_param, swig_api.Parameter)
value = each_param.getBuf(swig_api.PARAMETER_VALUE)
value = value.copyToNumpyArray()

# Here the parameters could be saved wherever needed.
print each_param.getName(), value
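# For instance (illustrative path, assuming the directory exists):
#   np.save('params/%s.npy' % each_param.getName(), value)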

updater.finishPass()

gradient_machine.finish()


if __name__ == '__main__':
main()
155 changes: 155 additions & 0 deletions demo/image_classification/cifar_util.py
@@ -0,0 +1,155 @@
# Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Utility classes for preparing CIFAR-10 image data.
"""
import cPickle
import io
import random

import paddle.trainer.PyDataProvider2 as data_provider
import paddle.utils.image_util as image_util
from py_paddle import DataProviderConverter


class BatchPool(object):
"""Loads an entire sample generator into memory; each call yields freshly
shuffled mini-batches."""

def __init__(self, generator, batch_size):
self.data = list(generator)
self.batch_size = batch_size

def __call__(self):
random.shuffle(self.data)
for offset in xrange(0, len(self.data), self.batch_size):
limit = min(offset + self.batch_size, len(self.data))
yield self.data[offset:limit]
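
# Usage sketch (sample_generator is any generator of samples):
#   pool = BatchPool(sample_generator, batch_size=128)
#   for batch in pool():  # each call reshuffles and yields mini-batches
#       ...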


class Cifar10Data(object):
"""
Prepares CIFAR-10 data: holds everything needed to read image batches and
convert them into the format Paddle consumes for training and testing.
"""

def __init__(self,
meta,
train_file_list,
test_file_list,
batch_size,
img_size=32,
mean_img_size=32,
num_classes=10,
is_color=True,
use_jpeg=True):
self.mean_img_size = mean_img_size
self.img_size = img_size
self.num_classes = num_classes
self.train_file_list = train_file_list
self.test_file_list = test_file_list
self.is_color = is_color
if self.is_color:
self.img_raw_size = self.img_size * self.img_size * 3
else:
self.img_raw_size = self.img_size * self.img_size
self.meta_path = meta
self.use_jpeg = use_jpeg
self.batch_size = batch_size
self.img_mean = image_util.load_meta(self.meta_path, self.mean_img_size,
self.img_size, self.is_color)

# DataProviderConverter is a utility that converts Python objects into
# Paddle's C++ input format. The input specification is the same as for
# Paddle's DataProvider; here it is a positional list:
# [dense image vector, integer class label].
input_types = [
data_provider.dense_vector(self.img_raw_size),
data_provider.integer_value(self.num_classes)
]
self.data_converter = DataProviderConverter(input_types)

@staticmethod
def _input_order_converter(generator):
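"""Yield (image, label) tuples in the order declared in input_types."""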
for item in generator:
yield item['image'], item['label']

@staticmethod
def generator_to_batch(generator, batch_size):
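"""Group a sample generator into lists of at most batch_size items."""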
ret_val = list()
for each_item in generator:
ret_val.append(each_item)
if len(ret_val) == batch_size:
yield ret_val
ret_val = list()
if len(ret_val) != 0:
yield ret_val

def _read_data(self, is_train):
"""
The main function for loading data: iterate over all the images and
labels in the batch files listed in the train or test file list.
"""
if is_train:
file_list = self.train_file_list
else:
file_list = self.test_file_list

with open(file_list, 'r') as fdata:
lines = [line.strip() for line in fdata]
random.shuffle(lines)
for file_name in lines:
with io.open(file_name, 'rb') as f:
data = cPickle.load(f)
indexes = list(range(len(data['images'])))
if is_train:
random.shuffle(indexes)
for i in indexes:
if self.use_jpeg:
img = image_util.decode_jpeg(data['images'][i])
else:
img = data['images'][i]
img_feat = image_util.preprocess_img(
img, self.img_mean, self.img_size, is_train,
self.is_color)
label = data['labels'][i]
yield {
'image': img_feat.astype('float32'),
'label': int(label)
}

def train_data(self):
"""
Get the training data.
The training data is stored in an in-memory BatchPool. The current
implementation does not worry about memory or speed; it is deliberately
naive.
"""
train_data_generator = self._input_order_converter(
self._read_data(True))
train_data = BatchPool(train_data_generator, self.batch_size)
return train_data

def test_data(self):
"""
Get the test data.
The test data is grouped into batches by generator_to_batch; like
train_data, this is a deliberately naive implementation.
"""
test_data_generator = self._input_order_converter(
self._read_data(False))
test_data = self.generator_to_batch(test_data_generator,
self.batch_size)
return test_data