Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into transpiler_split_tensor

8 years ago · df50c14abd
parent 06b326b681 04bfed660b
commit df50c14abd
308 changed files with 9950 additions and 1974 deletions
--- a/adversarial/README.md
+++ b/adversarial/README.md
@ -0,0 +1,9 @@
 # Advbox
 Advbox is a Python toolbox to create adversarial examples that fool neural networks. It requires Python and paddle.
 ## How to use
 1. train a model and save it's parameters. (like fluid_mnist.py)
 2. load the parameters which is trained in step1, then reconstruct the model.(like mnist_tutorial_fgsm.py)
 3. use advbox to generate the adversarial sample.
--- a/adversarial/advbox/init.py
+++ b/adversarial/advbox/init.py
@ -0,0 +1,16 @@
 # Copyright (c) 2017 PaddlePaddle Authors. All Rights Reserved
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """
   A set of tools for generating adversarial example on paddle platform 
 """
--- a/adversarial/advbox/attacks/base.py
+++ b/adversarial/advbox/attacks/base.py
@ -0,0 +1,39 @@
 """
 The base model of the model.
 """
 from abc import ABCMeta, abstractmethod
 class Attack(object):
    """
    Abstract base class for adversarial attacks. `Attack` represent an adversarial attack
    which search an adversarial example. subclass should implement the _apply() method.
    Args:
        model(Model): an instance of the class advbox.base.Model.
    """
    __metaclass__ = ABCMeta
    def __init__(self, model):
        self.model = model
    def __call__(self, image_label):
        """
        Generate the adversarial sample.
        Args:
        image_label(list): The image and label tuple list with one element.
        """
        adv_img = self._apply(image_label)
        return adv_img
    @abstractmethod
    def _apply(self, image_label):
        """
        Search an adversarial example.
        Args:
        image_batch(list): The image and label tuple list with one element.
        """
        raise NotImplementedError
--- a/adversarial/advbox/attacks/gradientsign.py
+++ b/adversarial/advbox/attacks/gradientsign.py
@ -0,0 +1,38 @@
 """
 This module provide the attack method for FGSM's implement.
 """
 from __future__ import division
 import numpy as np
 from collections import Iterable
 from .base import Attack
 class GradientSignAttack(Attack):
    """
    This attack was originally implemented by Goodfellow et al. (2015) with the
    infinity norm (and is known as the "Fast Gradient Sign Method"). This is therefore called
    the Fast Gradient Method.
    Paper link: https://arxiv.org/abs/1412.6572
    """
    def _apply(self, image_label, epsilons=1000):
        assert len(image_label) == 1
        pre_label = np.argmax(self.model.predict(image_label))
        min_, max_ = self.model.bounds()
        gradient = self.model.gradient(image_label)
        gradient_sign = np.sign(gradient) * (max_ - min_)
        if not isinstance(epsilons, Iterable):
            epsilons = np.linspace(0, 1, num=epsilons + 1)
        for epsilon in epsilons:
            adv_img = image_label[0][0].reshape(
                gradient_sign.shape) + epsilon * gradient_sign
            adv_img = np.clip(adv_img, min_, max_)
            adv_label = np.argmax(self.model.predict([(adv_img, 0)]))
            if pre_label != adv_label:
                return adv_img
 FGSM = GradientSignAttack
--- a/adversarial/advbox/models/init.py
+++ b/adversarial/advbox/models/init.py
@ -0,0 +1,16 @@
 # Copyright (c) 2017 PaddlePaddle Authors. All Rights Reserved
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """
 Paddle model for target of attack 
 """
--- a/adversarial/advbox/models/base.py
+++ b/adversarial/advbox/models/base.py
@ -0,0 +1,90 @@
 """
 The base model of the model.
 """
 from abc import ABCMeta
 import abc
 abstractmethod = abc.abstractmethod
 class Model(object):
    """
    Base class of model to provide attack.
    Args:
        bounds(tuple): The lower and upper bound for the image pixel.
        channel_axis(int): The index of the axis that represents the color channel.
        preprocess(tuple): Two element tuple used to preprocess the input. First
            substract the first element, then divide the second element.
    """
    __metaclass__ = ABCMeta
    def __init__(self, bounds, channel_axis, preprocess=None):
        assert len(bounds) == 2
        assert channel_axis in [0, 1, 2, 3]
        if preprocess is None:
            preprocess = (0, 1)
        self._bounds = bounds
        self._channel_axis = channel_axis
        self._preprocess = preprocess
    def bounds(self):
        """
        Return the upper and lower bounds of the model.
        """
        return self._bounds
    def channel_axis(self):
        """
        Return the channel axis of the model.
        """
        return self._channel_axis
    def _process_input(self, input_):
        res = input_
        sub, div = self._preprocess
        if sub != 0:
            res = input_ - sub
        assert div != 0
        if div != 1:
            res /= div
        return res
    @abstractmethod
    def predict(self, image_batch):
        """
        Calculate the prediction of the image batch.
        Args:
            image_batch(numpy.ndarray): image batch of shape (batch_size, height, width, channels).
        Return:
            numpy.ndarray: predictions of the images with shape (batch_size, num_of_classes).
        """
        raise NotImplementedError
    @abstractmethod
    def num_classes(self):
        """
        Determine the number of the classes
        Return:
            int: the number of the classes
        """
        raise NotImplementedError
    @abstractmethod
    def gradient(self, image_batch):
        """
        Calculate the gradient of the cross-entropy loss w.r.t the image.
        Args:
            image_batch(list): The image and label tuple list.
        Return:
            numpy.ndarray: gradient of the cross-entropy loss w.r.t the image with
                the shape (height, width, channel).
        """
        raise NotImplementedError
--- a/adversarial/advbox/models/paddle.py
+++ b/adversarial/advbox/models/paddle.py
@ -0,0 +1,101 @@
 from __future__ import absolute_import
 import numpy as np
 import paddle.v2 as paddle
 import paddle.v2.fluid as fluid
 from paddle.v2.fluid.framework import program_guard
 from .base import Model
 class PaddleModel(Model):
    """
    Create a PaddleModel instance.
    When you need to generate a adversarial sample, you should construct an instance of PaddleModel.
    Args:
        program(paddle.v2.fluid.framework.Program): The program of the model which generate the adversarial sample.
        input_name(string): The name of the input.
        logits_name(string): The name of the logits.
        predict_name(string): The name of the predict.
        cost_name(string): The name of the loss in the program.
    """
    def __init__(self,
                 program,
                 input_name,
                 logits_name,
                 predict_name,
                 cost_name,
                 bounds,
                 channel_axis=3,
                 preprocess=None):
        super(PaddleModel, self).__init__(
            bounds=bounds, channel_axis=channel_axis, preprocess=preprocess)
        if preprocess is None:
            preprocess = (0, 1)
        self._program = program
        self._place = fluid.CPUPlace()
        self._exe = fluid.Executor(self._place)
        self._input_name = input_name
        self._logits_name = logits_name
        self._predict_name = predict_name
        self._cost_name = cost_name
        # gradient
        loss = self._program.block(0).var(self._cost_name)
        param_grads = fluid.backward.append_backward(
            loss, parameter_list=[self._input_name])
        self._gradient = dict(param_grads)[self._input_name]
    def predict(self, image_batch):
        """
            Predict the label of the image_batch.
            Args:
                image_batch(list): The image and label tuple list.
            Return:
                numpy.ndarray: predictions of the images with shape (batch_size, num_of_classes).
        """
        feeder = fluid.DataFeeder(
            feed_list=[self._input_name, self._logits_name],
            place=self._place,
            program=self._program)
        predict_var = self._program.block(0).var(self._predict_name)
        predict = self._exe.run(self._program,
                                feed=feeder.feed(image_batch),
                                fetch_list=[predict_var])
        return predict
    def num_classes(self):
        """
            Calculate the number of classes of the output label. 
        Return:
            int: the number of classes
        """
        predict_var = self._program.block(0).var(self._predict_name)
        assert len(predict_var.shape) == 2
        return predict_var.shape[1]
    def gradient(self, image_batch):
        """
        Calculate the gradient of the loss w.r.t the input.
        Args:
            image_batch(list): The image and label tuple list.
        Return:
            list: The list of the gradient of the image.
        """
        feeder = fluid.DataFeeder(
            feed_list=[self._input_name, self._logits_name],
            place=self._place,
            program=self._program)
        grad, = self._exe.run(self._program,
                              feed=feeder.feed(image_batch),
                              fetch_list=[self._gradient])
        return grad
--- a/adversarial/fluid_mnist.py
+++ b/adversarial/fluid_mnist.py
@ -0,0 +1,86 @@
 """
 CNN on mnist data using fluid api of paddlepaddle
 """
 import paddle.v2 as paddle
 import paddle.v2.fluid as fluid
 def mnist_cnn_model(img):
    """
    Mnist cnn model
    Args:
        img(Varaible): the input image to be recognized
    Returns:
        Variable: the label prediction
    """
    conv_pool_1 = fluid.nets.simple_img_conv_pool(
        input=img,
        num_filters=20,
        filter_size=5,
        pool_size=2,
        pool_stride=2,
        act='relu')
    conv_pool_2 = fluid.nets.simple_img_conv_pool(
        input=conv_pool_1,
        num_filters=50,
        filter_size=5,
        pool_size=2,
        pool_stride=2,
        act='relu')
    logits = fluid.layers.fc(input=conv_pool_2, size=10, act='softmax')
    return logits
 def main():
    """
    Train the cnn model on mnist datasets
    """
    img = fluid.layers.data(name='img', shape=[1, 28, 28], dtype='float32')
    label = fluid.layers.data(name='label', shape=[1], dtype='int64')
    logits = mnist_cnn_model(img)
    cost = fluid.layers.cross_entropy(input=logits, label=label)
    avg_cost = fluid.layers.mean(x=cost)
    optimizer = fluid.optimizer.Adam(learning_rate=0.01)
    optimizer.minimize(avg_cost)
    accuracy = fluid.evaluator.Accuracy(input=logits, label=label)
    BATCH_SIZE = 50
    PASS_NUM = 3
    ACC_THRESHOLD = 0.98
    LOSS_THRESHOLD = 10.0
    train_reader = paddle.batch(
        paddle.reader.shuffle(
            paddle.dataset.mnist.train(), buf_size=500),
        batch_size=BATCH_SIZE)
    place = fluid.CPUPlace()
    exe = fluid.Executor(place)
    feeder = fluid.DataFeeder(feed_list=[img, label], place=place)
    exe.run(fluid.default_startup_program())
    for pass_id in range(PASS_NUM):
        accuracy.reset(exe)
        for data in train_reader():
            loss, acc = exe.run(fluid.default_main_program(),
                                feed=feeder.feed(data),
                                fetch_list=[avg_cost] + accuracy.metrics)
            pass_acc = accuracy.eval(exe)
            print("pass_id=" + str(pass_id) + " acc=" + str(acc) + " pass_acc="
                  + str(pass_acc))
            if loss < LOSS_THRESHOLD and pass_acc > ACC_THRESHOLD:
                break
        pass_acc = accuracy.eval(exe)
        print("pass_id=" + str(pass_id) + " pass_acc=" + str(pass_acc))
    fluid.io.save_params(
        exe, dirname='./mnist', main_program=fluid.default_main_program())
    print('train mnist done')
 if __name__ == '__main__':
    main()
--- a/adversarial/mnist_tutorial_fgsm.py
+++ b/adversarial/mnist_tutorial_fgsm.py
@ -0,0 +1,87 @@
 """
 FGSM demos on mnist using advbox tool.
 """
 import paddle.v2 as paddle
 import paddle.v2.fluid as fluid
 import matplotlib.pyplot as plt
 import numpy as np
 from advbox.models.paddle import PaddleModel
 from advbox.attacks.gradientsign import GradientSignAttack
 def cnn_model(img):
    """
    Mnist cnn model
    Args:
        img(Varaible): the input image to be recognized
    Returns:
        Variable: the label prediction
    """
    #conv1 = fluid.nets.conv2d()
    conv_pool_1 = fluid.nets.simple_img_conv_pool(
        input=img,
        num_filters=20,
        filter_size=5,
        pool_size=2,
        pool_stride=2,
        act='relu')
    conv_pool_2 = fluid.nets.simple_img_conv_pool(
        input=conv_pool_1,
        num_filters=50,
        filter_size=5,
        pool_size=2,
        pool_stride=2,
        act='relu')
    logits = fluid.layers.fc(input=conv_pool_2, size=10, act='softmax')
    return logits
 def main():
    """
    Advbox demo which demonstrate how to use advbox.
    """
    IMG_NAME = 'img'
    LABEL_NAME = 'label'
    img = fluid.layers.data(name=IMG_NAME, shape=[1, 28, 28], dtype='float32')
    # gradient should flow
    img.stop_gradient = False
    label = fluid.layers.data(name=LABEL_NAME, shape=[1], dtype='int64')
    logits = cnn_model(img)
    cost = fluid.layers.cross_entropy(input=logits, label=label)
    avg_cost = fluid.layers.mean(x=cost)
    place = fluid.CPUPlace()
    exe = fluid.Executor(place)
    BATCH_SIZE = 1
    train_reader = paddle.batch(
        paddle.reader.shuffle(
            paddle.dataset.mnist.train(), buf_size=500),
        batch_size=BATCH_SIZE)
    feeder = fluid.DataFeeder(
        feed_list=[IMG_NAME, LABEL_NAME],
        place=place,
        program=fluid.default_main_program())
    fluid.io.load_params(
        exe, "./mnist/", main_program=fluid.default_main_program())
    # advbox demo
    m = PaddleModel(fluid.default_main_program(), IMG_NAME, LABEL_NAME,
                    logits.name, avg_cost.name, (-1, 1))
    att = GradientSignAttack(m)
    for data in train_reader():
        # fgsm attack
        adv_img = att(data)
        plt.imshow(n[0][0], cmap='Greys_r')
        plt.show()
        #np.save('adv_img', adv_img)
        break
 if __name__ == '__main__':
    main()
--- a/benchmark/IntelOptimizedPaddle.md
+++ b/benchmark/IntelOptimizedPaddle.md
@ -7,11 +7,11 @@ Machine:
 System: CentOS release 6.3 (Final), Docker 1.12.1.
-PaddlePaddle: (TODO: will rerun after 0.11.0)
+PaddlePaddle:
- paddlepaddle/paddle:latest (for MKLML and MKL-DNN)
+- paddlepaddle/paddle:0.11.0 (for MKLML and MKL-DNN)
  - MKL-DNN tag v0.11
  - MKLML 2018.0.1.20171007
- paddlepaddle/paddle:latest-openblas (for OpenBLAS)
+- paddlepaddle/paddle:0.11.0-openblas (for OpenBLAS)
  - OpenBLAS v0.2.20
 On each machine, we will test and compare the performance of training on single node using MKL-DNN / MKLML / OpenBLAS respectively.
@ -56,15 +56,15 @@ Input image size - 3 * 224 * 224, Time: images/second
 <img src="figs/googlenet-cpu-train.png" width="500">
- Alexnet
+- AlexNet
 | BatchSize    | 64     | 128    | 256    |
 |--------------|--------| ------ | -------|
-| OpenBLAS     | 2.13   | 2.45   | 2.68   | 
+| OpenBLAS     | 45.62  | 72.79  | 107.22 | 
 | MKLML        | 66.37  | 105.60 | 144.04 |
 | MKL-DNN      | 399.00 | 498.94 | 626.53 | 
-chart TBD
+<img src="figs/alexnet-cpu-train.png" width="500">
 #### Inference
 Test on batch size 1, 2, 4, 8, 16 on Intel(R) Xeon(R) Gold 6148 CPU @ 2.40GHz
@ -72,36 +72,41 @@ Test on batch size 1, 2, 4, 8, 16 on Intel(R) Xeon(R) Gold 6148 CPU @ 2.40GHz
 | BatchSize | 1     | 2     | 4     | 8     | 16    |
 |-----------|-------|-------|-------|-------|-------|
-| OpenBLAS  | 1.07  | 1.08  | 1.06  | 0.88  | 0.65  |
+| OpenBLAS  | 1.10  | 1.96  | 3.62  | 3.63  | 2.25  |
 | MKLML     | 5.58  | 9.80  | 15.15 | 21.21 | 28.67 |
 | MKL-DNN   | 75.07 | 88.64 | 82.58 | 92.29 | 96.75 |
 <img src="figs/vgg-cpu-infer.png" width="500">
 - ResNet-50
 | BatchSize | 1     | 2      | 4      | 8      | 16     |
 |-----------|-------|--------|--------|--------|--------|
-| OpenBLAS  | 3.35  | 3.19   | 3.09   | 2.55   | 1.96   |
+| OpenBLAS  | 3.31  | 6.72   | 11.59  | 13.17  | 9.27   |
 | MKLML     | 6.33  | 12.02  | 22.88  | 40.53  | 63.09  |
 | MKL-DNN   | 107.83| 148.84 | 177.78 | 189.35 | 217.69 |
 <img src="figs/resnet-cpu-infer.png" width="500">
 - GoogLeNet
 | BatchSize | 1      | 2      | 4      | 8      | 16     |
 |-----------|--------|--------|--------|--------|--------|
-| OpenBLAS  | 12.04  | 11.31  | 10.00  | 9.07   | 4.34   |
+| OpenBLAS  | 12.06  | 23.56  | 34.48  | 36.45  | 23.12  |
 | MKLML     | 22.74  | 41.56  | 81.22  | 133.47 | 210.53 |
 | MKL-DNN   | 175.10 | 272.92 | 450.70 | 512.00 | 600.94 |
- Alexnet
+<img src="figs/googlenet-cpu-infer.png" width="500">
 - AlexNet
 | BatchSize | 1      | 2      | 4      | 8      | 16     |
 |-----------|--------|--------|--------|--------|--------|
-| OpenBLAS  |    |   |   |   |    |
+| OpenBLAS  | 3.53   | 6.23   | 15.04  | 26.06  | 31.62  |
 | MKLML     | 21.32  | 36.55  | 73.06  | 131.15 | 192.77 |
 | MKL-DNN   | 442.91 | 656.41 | 719.10 | 847.68 | 850.51 |
-chart TBD
+<img src="figs/alexnet-cpu-infer.png" width="500">
 ### Laptop
 TBD
--- a/benchmark/cluster/README.md
+++ b/benchmark/cluster/README.md
@ -0,0 +1,78 @@
 # Cluster Training Benchmark
 ## Setup
 - Platform
  - Kubernetes: v1.6.2
  - Linux Kernel: v3.10.0
 - Resource
  - CPU: 10 Cores per Pod
  - Memory: 5GB per Pod
 - Docker Image
  We use different base Docker Image to run the benchmark on Kubernetes:
  - PaddlePaddle v2: paddlepaddle/paddle:0.11.0
  - PaddlePaddle Fluid: paddlepaddle/paddle:[commit-id]
  - TensorFlow: tensorflow/tensorflow:1.5.0-rc0
 - Model
  vgg16 is used in this benchmark.
 ## Cases
 - Variable
  - Batch Size of training data.
  - PServer count of the training job.
  - The number of trainers.
 - Invariant
  - The resource of trainer/pserver Pod.
 ### Measure the Performance for Different Batch Size
 - PServer Count: 40
 - Trainer Count: 100
 - Metrics: mini-batch / sec
 | Batch Size | 32 | 64 | 128 | 256 |
 | -- | -- | -- | -- | -- |
 | PaddlePaddle Fluid | - | - | - | - |
 | PaddlePaddle v2 | - | - | - | - |
 | TensorFlow | - | - | - | - |
 ### Measure the Performance for Different PServer Count
 - Trainer Count: 100
 - Batch Size: 64
 - Metrics: mini-batch / sec
 | PServer Count | 10 | 20 | 40 | 60 |
 | -- | -- | -- | -- | -- |
 | PaddlePaddle Fluid | - | - | - | - |
 | PaddlePaddle v2 | - | - | - | - |
 | TensorFlow | - | - | - | - |
 ### Measure Parallel Efficiency By Increasing Trainer Count
 - PServer Count: 20
 - Batch Size: 64
 - Metrics:
 $S = \div(T1, TN)$
 which S is the ratio of T1 over TN, training time of 1 and N trainers.
 The parallel efficiency is:
 $E = \div(S, N)$
 | Trainer Counter | 1 | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
 | -- | -- | -- | -- | -- | -- | -- | -- | -- | -- | -- | -- |
 | PaddlePaddle Fluid | - | - | - | - | - | - | - | - | - | - | - |
 | PaddlePaddle v2 | - | - | - | - | - | - | - | - | - | - | - | - |
 | TensorFlow | - | - | - | - | - | - | - | - | - | - | - | - | - |
 ## Reproduce the benchmark
 TODO
--- a/benchmark/figs/alexnet-cpu-infer.png
+++ b/benchmark/figs/alexnet-cpu-infer.png
--- a/benchmark/figs/alexnet-cpu-train.png
+++ b/benchmark/figs/alexnet-cpu-train.png
--- a/benchmark/figs/googlenet-cpu-infer.png
+++ b/benchmark/figs/googlenet-cpu-infer.png
--- a/benchmark/figs/googlenet-cpu-train.png
+++ b/benchmark/figs/googlenet-cpu-train.png
--- a/benchmark/figs/resnet-cpu-infer.png
+++ b/benchmark/figs/resnet-cpu-infer.png
--- a/benchmark/figs/resnet-cpu-train.png
+++ b/benchmark/figs/resnet-cpu-train.png
--- a/benchmark/figs/vgg-cpu-infer.png
+++ b/benchmark/figs/vgg-cpu-infer.png
--- a/benchmark/figs/vgg-cpu-train.png
+++ b/benchmark/figs/vgg-cpu-train.png
--- a/benchmark/paddle/image/plotlog.py
+++ b/benchmark/paddle/image/plotlog.py
@ -0,0 +1,114 @@
 # Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import sys
 import argparse
 import matplotlib.pyplot as plt
 def parse_args():
    parser = argparse.ArgumentParser('Parse Log')
    parser.add_argument(
        '--file_path', '-f', type=str, help='the path of the log file')
    parser.add_argument(
        '--sample_rate',
        '-s',
        type=float,
        default=1.0,
        help='the rate to take samples from log')
    parser.add_argument(
        '--log_period', '-p', type=int, default=1, help='the period of log')
    args = parser.parse_args()
    return args
 def parse_file(file_name):
    loss = []
    error = []
    with open(file_name) as f:
        for i, line in enumerate(f):
            line = line.strip()
            if not line.startswith('pass'):
                continue
            line_split = line.split(' ')
            if len(line_split) != 5:
                continue
            loss_str = line_split[2][:-1]
            cur_loss = float(loss_str.split('=')[-1])
            loss.append(cur_loss)
            err_str = line_split[3][:-1]
            cur_err = float(err_str.split('=')[-1])
            error.append(cur_err)
    accuracy = [1.0 - err for err in error]
    return loss, accuracy
 def sample(metric, sample_rate):
    interval = int(1.0 / sample_rate)
    if interval > len(metric):
        return metric[:1]
    num = len(metric) / interval
    idx = [interval * i for i in range(num)]
    metric_sample = [metric[id] for id in idx]
    return metric_sample
 def plot_metric(metric,
                batch_id,
                graph_title,
                line_style='b-',
                line_label='y',
                line_num=1):
    plt.figure()
    plt.title(graph_title)
    if line_num == 1:
        plt.plot(batch_id, metric, line_style, label=line_label)
    else:
        for i in range(line_num):
            plt.plot(batch_id, metric[i], line_style[i], label=line_label[i])
    plt.xlabel('batch')
    plt.ylabel(graph_title)
    plt.legend()
    plt.savefig(graph_title + '.jpg')
    plt.close()
 def main():
    args = parse_args()
    assert args.sample_rate > 0. and args.sample_rate <= 1.0, "The sample rate should in the range (0, 1]."
    loss, accuracy = parse_file(args.file_path)
    batch = [args.log_period * i for i in range(len(loss))]
    batch_sample = sample(batch, args.sample_rate)
    loss_sample = sample(loss, args.sample_rate)
    accuracy_sample = sample(accuracy, args.sample_rate)
    plot_metric(loss_sample, batch_sample, 'loss', line_label='loss')
    plot_metric(
        accuracy_sample,
        batch_sample,
        'accuracy',
        line_style='g-',
        line_label='accuracy')
 if __name__ == '__main__':
    main()
--- a/benchmark/paddle/image/run_openblas_infer.sh
+++ b/benchmark/paddle/image/run_openblas_infer.sh
@ -8,6 +8,7 @@ function clock_to_seconds() {
 }
 function infer() {
  export OPENBLAS_MAIN_FREE=1
  topology=$1
  layer_num=$2
  bs=$3
--- a/cmake/external/mkldnn.cmake
+++ b/cmake/external/mkldnn.cmake
@ -63,9 +63,30 @@ ExternalProject_Add(
                        -DMKLROOT:PATH=${MKLML_ROOT}
 )
-ADD_LIBRARY(mkldnn SHARED IMPORTED GLOBAL)
+ADD_LIBRARY(shared_mkldnn SHARED IMPORTED GLOBAL)
-SET_PROPERTY(TARGET mkldnn PROPERTY IMPORTED_LOCATION ${MKLDNN_LIB})
+SET_PROPERTY(TARGET shared_mkldnn PROPERTY IMPORTED_LOCATION ${MKLDNN_LIB})
-ADD_DEPENDENCIES(mkldnn ${MKLDNN_PROJECT})
+ADD_DEPENDENCIES(shared_mkldnn ${MKLDNN_PROJECT})
 MESSAGE(STATUS "MKLDNN library: ${MKLDNN_LIB}")
 add_definitions(-DPADDLE_WITH_MKLDNN)
-LIST(APPEND external_project_dependencies mkldnn)
+LIST(APPEND external_project_dependencies shared_mkldnn)
 # generate a static dummy target to track mkldnn dependencies
 # for cc_library(xxx SRCS xxx.c DEPS mkldnn)
 SET(dummyfile ${CMAKE_CURRENT_BINARY_DIR}/mkldnn_dummy.c)
 FILE(WRITE ${dummyfile} "const char * dummy = \"${dummyfile}\";")
 ADD_LIBRARY(mkldnn STATIC ${dummyfile})
 TARGET_LINK_LIBRARIES(mkldnn ${MKLDNN_LIB} ${MKLML_LIB} ${MKLML_IOMP_LIB})
 ADD_DEPENDENCIES(mkldnn ${MKLDNN_PROJECT})
 # copy the real so.0 lib to install dir
 # it can be directly contained in wheel or capi
 SET(MKLDNN_SHARED_LIB ${MKLDNN_INSTALL_DIR}/libmkldnn.so.0)
 ADD_CUSTOM_COMMAND(OUTPUT ${MKLDNN_SHARED_LIB}
    COMMAND cp ${MKLDNN_LIB} ${MKLDNN_SHARED_LIB}
    DEPENDS mkldnn)
 ADD_CUSTOM_TARGET(mkldnn_shared_lib ALL DEPENDS ${MKLDNN_SHARED_LIB})
 IF(WITH_C_API)
  INSTALL(FILES ${MKLDNN_SHARED_LIB} DESTINATION lib)
 ENDIF()
--- a/cmake/external/mklml.cmake
+++ b/cmake/external/mklml.cmake
@ -66,3 +66,7 @@ ADD_LIBRARY(mklml SHARED IMPORTED GLOBAL)
 SET_PROPERTY(TARGET mklml PROPERTY IMPORTED_LOCATION ${MKLML_LIB})
 ADD_DEPENDENCIES(mklml ${MKLML_PROJECT})
 LIST(APPEND external_project_dependencies mklml)
 IF(WITH_C_API)
  INSTALL(FILES ${MKLML_LIB} ${MKLML_IOMP_LIB} DESTINATION lib)
 ENDIF()
--- a/cmake/external/warpctc.cmake
+++ b/cmake/external/warpctc.cmake
@ -63,7 +63,7 @@ ExternalProject_Add(
 MESSAGE(STATUS "warp-ctc library: ${WARPCTC_LIBRARIES}")
 INCLUDE_DIRECTORIES(${WARPCTC_INCLUDE_DIR})
-ADD_LIBRARY(warpctc STATIC IMPORTED GLOBAL)
+ADD_LIBRARY(warpctc SHARED IMPORTED GLOBAL)
 SET_PROPERTY(TARGET warpctc PROPERTY IMPORTED_LOCATION ${WARPCTC_LIBRARIES})
 ADD_DEPENDENCIES(warpctc extern_warpctc)
--- a/doc/api/v2/fluid.rst
+++ b/doc/api/v2/fluid.rst
@ -15,4 +15,4 @@ Fluid
    fluid/param_attr.rst
    fluid/profiler.rst
    fluid/regularizer.rst
-
+    fluid/io.rst
--- a/Show More
+++ b/Show More