Merge remote-tracking branch 'upstream/develop' into develop

avx_docs
zhouti 8 years ago
commit c9baf82447

@@ -13,8 +13,6 @@
 # The document of clang-format is
 # http://clang.llvm.org/docs/ClangFormat.html
 # http://clang.llvm.org/docs/ClangFormatStyleOptions.html
-#
-# TODO(yuyang18): Add python and other language code style
 ---
 Language: Cpp
 BasedOnStyle: Google
@@ -22,8 +20,9 @@ IndentWidth: 2
 TabWidth: 2
 ContinuationIndentWidth: 4
 AccessModifierOffset: -2 # The private/protected/public has no indent in class
+PointerAlignment: Left # int* p/int& p, not int *p/int &p
 Standard: Cpp11
 AllowAllParametersOfDeclarationOnNextLine: true
 BinPackParameters: false
 BinPackArguments: false
 ...

.gitignore

@@ -5,4 +5,6 @@ build/
 .vscode
 .idea
 .project
+.cproject
 .pydevproject
+Makefile

@ -0,0 +1,20 @@
- repo: https://github.com/Lucas-C/pre-commit-hooks.git
sha: c25201a00e6b0514370501050cf2a8538ac12270
hooks:
- id: remove-crlf
- repo: https://github.com/reyoung/mirrors-yapf.git
sha: v0.13.2
hooks:
- id: yapf
- repo: https://github.com/pre-commit/pre-commit-hooks
sha: 7539d8bd1a00a3c1bfd34cdb606d3a6372e83469
hooks:
- id: check-added-large-files
- id: check-merge-conflict
- id: check-symlinks
- id: detect-private-key
- id: end-of-file-fixer
- repo: https://github.com/PaddlePaddle/clang-format-pre-commit-hook.git
sha: 28c0ea8a67a3e2dbbf4822ef44e85b63a0080a29
hooks:
- id: clang-formater

@@ -0,0 +1,3 @@
+[style]
+based_on_style = pep8
+column_limit = 80
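
For reference, this is roughly what the pinned yapf style does to over-long code; a minimal sketch (the `FormatCode` helper lives at this import path in yapf, but its tuple return value is from later releases than the v0.13.2 pinned above, so treat it as an assumption):

# Sketch: reformat a snippet with the repo's style (pep8 base, 80 columns).
# Assumes a yapf version where FormatCode returns (formatted_text, changed).
from yapf.yapflib.yapf_api import FormatCode

ugly = ("label_map = {0: 'airplane', 1: 'automobile', 2: 'bird', "
        "3: 'cat', 4: 'deer', 5: 'dog'}\n")
pretty, changed = FormatCode(ugly, style_config='pep8')
print(pretty)  # reflowed to fit the 80-column limit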

@@ -38,10 +38,19 @@ addons:
     - curl
     - lcov
     - graphviz
+    - swig
 before_install:
+  - |
+    if [ ${JOB} == "BUILD_AND_TEST" ]; then
+      if ! git diff --name-only $TRAVIS_COMMIT_RANGE | grep -qvE '(\.md$)'
+      then
+        echo "Only markdown docs were updated, stopping build process."
+        exit
+      fi
+    fi
   - if [[ "$TRAVIS_OS_NAME" == "linux" ]]; then sudo paddle/scripts/travis/before_install.linux.sh; fi
   - if [[ "$TRAVIS_OS_NAME" == "osx" ]]; then paddle/scripts/travis/before_install.osx.sh; fi
-  - pip install wheel protobuf sphinx breathe recommonmark
+  - pip install wheel protobuf sphinx breathe recommonmark virtualenv numpy
 script:
   - paddle/scripts/travis/main.sh
 notifications:
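
The new `before_install` step above short-circuits the `BUILD_AND_TEST` job when a push only touches Markdown: the build continues only if `git diff --name-only` lists at least one non-`.md` file. The same check as a hedged Python sketch (`TRAVIS_COMMIT_RANGE` is the variable Travis exports; the fallback range is illustrative):

# Sketch of the docs-only short-circuit: list files changed in the commit
# range and stop early when every one of them ends in .md.
import os
import subprocess
import sys

commit_range = os.environ.get("TRAVIS_COMMIT_RANGE", "HEAD~1..HEAD")
out = subprocess.check_output(
    ["git", "diff", "--name-only", commit_range]).decode()
changed = [line for line in out.splitlines() if line.strip()]
if changed and all(name.endswith(".md") for name in changed):
    print("Only markdown docs were updated, stopping build process.")
    sys.exit(0)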

@@ -2,8 +2,8 @@ cmake_minimum_required(VERSION 2.8)
 project(paddle CXX C)
 set(PADDLE_MAJOR_VERSION 0)
-set(PADDLE_MINOR_VERSION 8)
-set(PADDLE_PATCH_VERSION 0b3)
+set(PADDLE_MINOR_VERSION 9)
+set(PADDLE_PATCH_VERSION 0a0)
 set(PADDLE_VERSION ${PADDLE_MAJOR_VERSION}.${PADDLE_MINOR_VERSION}.${PADDLE_PATCH_VERSION})
 set(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} "${CMAKE_SOURCE_DIR}/cmake")
@@ -95,11 +95,24 @@ if(NOT WITH_GPU)
     add_definitions(-DHPPL_STUB_FUNC)
     list(APPEND CMAKE_CXX_SOURCE_FILE_EXTENSIONS cu)
 else()
-    if(${CUDA_VERSION_MAJOR} GREATER 6)
-        if(COMPILER_SUPPORT_CXX11)
-            LIST(APPEND CUDA_NVCC_FLAGS -std=c++11)
-        endif()
-    endif()
     # TODO(yuyang18): Change it to remove std=c++11 in cuda compile.
     set(CUDA_PROPAGATE_HOST_FLAGS OFF)
     if(NOT CUDNN_FOUND)
         message(FATAL_ERROR "Paddle need cudnn to compile")
     endif()
+    set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} "-g -O3 --use_fast_math")
+
+    if(WITH_AVX)
+        set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} "-Xcompiler ${AVX_FLAG}")
+    else(WITH_AVX)
+        set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} "-Xcompiler ${SSE3_FLAG}")
+    endif(WITH_AVX)
 
     if(WITH_DSO)
         set(CUDA_LIBRARIES "")
@@ -123,11 +136,11 @@ if(NOT WITH_TIMER)
 endif(NOT WITH_TIMER)
 
 if(WITH_AVX)
-    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${AVX_FLAGS}")
-    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${AVX_FLAGS}")
+    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${AVX_FLAG}")
+    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${AVX_FLAG}")
 else(WITH_AVX)
-    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -msse3")
-    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -msse3")
+    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${SSE3_FLAG}")
+    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${SSE3_FLAG}")
 endif(WITH_AVX)
 
 if(WITH_PYTHON)

@@ -7,7 +7,7 @@ Before submitting the issue, look over the following criteria before handing you
 - [ ] Was there a similar issue submitted or resolved before ? You could search issue in the github.
 - [ ] Did you retrieve your issue from widespread search engines ?
 - [ ] Is my description of the issue clear enough to reproduce this problem?
-    * If some errors occured, we need details about `how do you run your code?`, `what system do you use?`, `Are you using GPU or not?`, etc.
+    * If some errors occurred, we need details about `how do you run your code?`, `what system do you use?`, `Are you using GPU or not?`, etc.
     * If you use an recording [asciinema](https://asciinema.org/) to show what you are doing to make it happen, that's awesome! We could help you solve the problem more quickly.
 - [ ] Is my description of the issue use the github markdown correctly?
     * Please use the proper markdown syntaxes for styling all forms of writing, e.g, source code, error information, etc.

@@ -1,10 +1,13 @@
 # PaddlePaddle
-[![Build Status](https://travis-ci.org/baidu/Paddle.svg?branch=master)](https://travis-ci.org/baidu/Paddle)
-[![Coverage Status](https://coveralls.io/repos/github/baidu/Paddle/badge.svg?branch=develop)](https://coveralls.io/github/baidu/Paddle?branch=develop)
-[![Join the chat at https://gitter.im/PaddlePaddle/Deep_Learning](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/PaddlePaddle/Deep_Learning?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge)
-[![License](https://img.shields.io/badge/license-Apache%202.0-green.svg)](LICENSE)
+[![Build Status](https://travis-ci.org/PaddlePaddle/Paddle.svg?branch=develop)](https://travis-ci.org/PaddlePaddle/Paddle)
+[![Documentation Status](https://img.shields.io/badge/docs-latest-brightgreen.svg?style=flat)](http://www.paddlepaddle.org/)
+[![Documentation Status](https://img.shields.io/badge/中文文档-最新-brightgreen.svg)](http://www.paddlepaddle.org/cn/index.html)
+[![Coverage Status](https://coveralls.io/repos/github/PaddlePaddle/Paddle/badge.svg?branch=develop)](https://coveralls.io/github/PaddlePaddle/Paddle?branch=develop)
+[![Release](https://img.shields.io/github/release/PaddlePaddle/Paddle.svg)](https://github.com/PaddlePaddle/Paddle/releases)
+[![License](https://img.shields.io/badge/license-Apache%202-blue.svg)](LICENSE)
 
 Welcome to the PaddlePaddle GitHub.
@@ -14,7 +17,7 @@ developed by Baidu scientists and engineers for the purpose of applying deep
 learning to many products at Baidu.
 
 Our vision is to enable deep learning for everyone via PaddlePaddle.
-Please refer to our [release log](https://github.com/baidu/Paddle/releases) to track the latest feature of PaddlePaddle.
+Please refer to our [release announcement](https://github.com/PaddlePaddle/Paddle/releases) to track the latest feature of PaddlePaddle.
 
 ## Features
@@ -26,15 +29,15 @@ Please refer to our [release log](https://github.com/baidu/Paddle/releases) to t
     connection.
 
 - **Efficiency**
 
   In order to unleash the power of heterogeneous computing resource,
   optimization occurs at different levels of PaddlePaddle, including
   computing, memory, architecture and communication. The following are some
   examples:
   - Optimized math operations through SSE/AVX intrinsics, BLAS libraries
     (e.g. MKL, ATLAS, cuBLAS) or customized CPU/GPU kernels.
   - Highly optimized recurrent networks which can handle **variable-length**
     sequence without padding.
   - Optimized local and distributed training for models with high dimensional
     sparse data.
@@ -57,41 +60,39 @@ Please refer to our [release log](https://github.com/baidu/Paddle/releases) to t
 ## Installation
 
 Check out the [Install Guide](http://paddlepaddle.org/doc/build/) to install from
 pre-built packages (**docker image**, **deb package**) or
 directly build on **Linux** and **Mac OS X** from the source code.
 
 ## Documentation
 
 Both [English Docs](http://paddlepaddle.org/doc/) and [Chinese Docs](http://paddlepaddle.org/doc_cn/) are provided for our users and developers.
 
 - [Quick Start](http://paddlepaddle.org/doc/demo/quick_start/index_en) <br>
   You can follow the quick start tutorial to learn how use PaddlePaddle
   step-by-step.
 
 - [Example and Demo](http://paddlepaddle.org/doc/demo/) <br>
   We provide five demos, including: image classification, sentiment analysis,
   sequence to sequence model, recommendation, semantic role labeling.
 
 - [Distributed Training](http://paddlepaddle.org/doc/cluster) <br>
   This system supports training deep learning models on multiple machines
   with data parallelism.
 
 - [Python API](http://paddlepaddle.org/doc/ui/) <br>
   PaddlePaddle supports using either Python interface or C++ to build your
   system. We also use SWIG to wrap C++ source code to create a user friendly
   interface for Python. You can also use SWIG to create interface for your
   favorite programming language.
 
 - [How to Contribute](http://paddlepaddle.org/doc/build/contribute_to_paddle.html) <br>
   We sincerely appreciate your interest and contributions. If you would like to
   contribute, please read the contribution guide.
 
 - [Source Code Documents](http://paddlepaddle.org/doc/source/) <br>
 
 ## Ask Questions
 
-Please join the [**gitter chat**](https://gitter.im/PaddlePaddle/Deep_Learning) or send email to
-**paddle-dev@baidu.com** to ask questions and talk about methods and models.
-Framework development discussions and
-bug reports are collected on [Issues](https://github.com/baidu/paddle/issues).
+You are welcome to submit questions and bug reports as [Github Issues](https://github.com/PaddlePaddle/Paddle/issues).
 
 ## Copyright and License
 PaddlePaddle is provided under the [Apache-2.0 license](LICENSE).

@@ -3,36 +3,55 @@
 INCLUDE(CheckCXXSourceRuns)
 
-SET(FIND_AVX_10)
-SET(FIND_AVX_20)
-SET(AVX_FLAGS)
-SET(AVX_FOUND)
-
-# Check AVX 2
-SET(CMAKE_REQUIRED_FLAGS)
 IF(CMAKE_COMPILER_IS_GNUCC OR CMAKE_COMPILER_IS_GNUCXX OR CMAKE_CXX_COMPILER_ID MATCHES "Clang")
-  SET(CMAKE_REQUIRED_FLAGS "-mavx2")
-ELSEIF(MSVC AND NOT CMAKE_CL_64) # reserve for WINDOWS
-  SET(CMAKE_REQUIRED_FLAGS "/arch:AVX2")
+  set(MMX_FLAG "-mmmx")
+  set(SSE2_FLAG "-msse2")
+  set(SSE3_FLAG "-msse3")
+  SET(AVX_FLAG "-mavx")
+  SET(AVX2_FLAG "-mavx2")
+ELSEIF(MSVC)
+  set(MMX_FLAG "/arch:MMX")
+  set(SSE2_FLAG "/arch:SSE2")
+  set(SSE3_FLAG "/arch:SSE3")
+  SET(AVX_FLAG "/arch:AVX")
+  SET(AVX2_FLAG "/arch:AVX2")
 ENDIF()
 
+# Check MMX
+set(CMAKE_REQUIRED_FLAGS ${MMX_FLAG})
 CHECK_CXX_SOURCE_RUNS("
-#include <immintrin.h>
+#include <mmintrin.h>
 int main()
 {
-    __m256i a = _mm256_set_epi32 (-1, 2, -3, 4, -1, 2, -3, 4);
-    __m256i result = _mm256_abs_epi32 (a);
+    _mm_setzero_si64();
     return 0;
-}" FIND_AVX_20)
+}" MMX_FOUND)
 
-# Check AVX
-SET(CMAKE_REQUIRED_FLAGS)
-IF(CMAKE_COMPILER_IS_GNUCC OR CMAKE_COMPILER_IS_GNUCXX OR CMAKE_CXX_COMPILER_ID MATCHES "Clang")
-  SET(CMAKE_REQUIRED_FLAGS "-mavx")
-ELSEIF(MSVC AND NOT CMAKE_CL_64)
-  SET(CMAKE_REQUIRED_FLAGS "/arch:AVX")
-endif()
+# Check SSE2
+set(CMAKE_REQUIRED_FLAGS ${SSE2_FLAG})
+CHECK_CXX_SOURCE_RUNS("
+#include <emmintrin.h>
+int main()
+{
+    _mm_setzero_si128();
+    return 0;
+}" SSE2_FOUND)
 
+# Check SSE3
+set(CMAKE_REQUIRED_FLAGS ${SSE3_FLAG})
+CHECK_CXX_SOURCE_RUNS("
+#include <pmmintrin.h>
+int main()
+{
+    __m128d a = _mm_set1_pd(6.28);
+    __m128d b = _mm_set1_pd(3.14);
+    __m128d result = _mm_addsub_pd(a, b);
+    result = _mm_movedup_pd(result);
+    return 0;
+}" SSE3_FOUND)
+
+# Check AVX
+set(CMAKE_REQUIRED_FLAGS ${AVX_FLAG})
 CHECK_CXX_SOURCE_RUNS("
 #include <immintrin.h>
 int main()
@@ -41,25 +60,17 @@ int main()
 __m256 b = _mm256_set_ps (1.0f, 2.0f, 3.0f, 4.0f, 1.0f, 2.0f, 3.0f, 4.0f);
 __m256 result = _mm256_add_ps (a, b);
 return 0;
-}" FIND_AVX_10)
+}" AVX_FOUND)
 
-IF(${FIND_AVX_20})
-  IF(CMAKE_COMPILER_IS_GNUCC OR CMAKE_COMPILER_IS_GNUCXX OR CMAKE_CXX_COMPILER_ID MATCHES "Clang")
-    SET(AVX_FLAGS "${AVX_FLAGS} -mavx2")
-  ELSEIF(MSVC)
-    SET(AVX_FLAGS "${AVX_FLAGS} /arch:AVX2")
-  ENDIF()
-ENDIF()
+# Check AVX 2
+set(CMAKE_REQUIRED_FLAGS ${AVX2_FLAG})
+CHECK_CXX_SOURCE_RUNS("
+#include <immintrin.h>
+int main()
+{
+    __m256i a = _mm256_set_epi32 (-1, 2, -3, 4, -1, 2, -3, 4);
+    __m256i result = _mm256_abs_epi32 (a);
+    return 0;
+}" AVX2_FOUND)
 
-IF(${FIND_AVX_10})
-  IF(CMAKE_COMPILER_IS_GNUCC OR CMAKE_COMPILER_IS_GNUCXX OR CMAKE_CXX_COMPILER_ID MATCHES "Clang")
-    SET(AVX_FLAGS "${AVX_FLAGS} -mavx")
-  ELSEIF(MSVC)
-    SET(AVX_FLAGS "${AVX_FLAGS} /arch:AVX")
-  ENDIF()
-ENDIF()
-
-IF(${FIND_AVX_10})
-  SET(AVX_FOUND TRUE)
-  MESSAGE(STATUS "Find CPU supports ${AVX_FLAGS}.")
-ENDIF()
+mark_as_advanced(MMX_FOUND SSE2_FOUND SSE3_FOUND AVX_FOUND AVX2_FOUND)
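
`CHECK_CXX_SOURCE_RUNS` both compiles the snippet with the candidate flag and executes the resulting binary, so a passing check proves compiler *and* host-CPU support at once. A rough Python analogue of one probe (the `c++` compiler name is an assumption, everything else mirrors the AVX snippet above):

# Rough Python analogue of CHECK_CXX_SOURCE_RUNS: compile a tiny probe with
# the candidate flag and run it; success means compiler *and* CPU support.
import os
import subprocess
import tempfile

AVX_PROBE = r"""
#include <immintrin.h>
int main() {
    __m256 a = _mm256_set_ps(-1.0f, 2.0f, -3.0f, 4.0f, -1.0f, 2.0f, -3.0f, 4.0f);
    __m256 b = _mm256_set_ps(1.0f, 2.0f, 3.0f, 4.0f, 1.0f, 2.0f, 3.0f, 4.0f);
    __m256 result = _mm256_add_ps(a, b);
    (void)result;
    return 0;
}
"""

def source_runs(source, flag, cxx="c++"):  # compiler name is an assumption
    with tempfile.TemporaryDirectory() as tmp:
        src = os.path.join(tmp, "probe.cpp")
        exe = os.path.join(tmp, "probe")
        with open(src, "w") as f:
            f.write(source)
        if subprocess.call([cxx, flag, src, "-o", exe]) != 0:
            return False  # compiler rejected the flag or the intrinsics
        return subprocess.call([exe]) == 0  # a crash here means no CPU support

print("AVX:", source_runs(AVX_PROBE, "-mavx"))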

@@ -188,14 +188,6 @@ macro(add_simple_unittest TARGET_NAME)
   add_unittest(${TARGET_NAME} ${TARGET_NAME}.cpp)
 endmacro()
 
-macro(add_paddle_culib TARGET_NAME)
-  set(NVCC_FLAG ${CUDA_NVCC_FLAGS})
-  set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS};--use_fast_math)
-  cuda_add_library(${TARGET_NAME} STATIC ${ARGN})
-  set(CUDA_NVCC_FLAGS ${NVCC_FLAG})
-endmacro()
-
 # Creates C resources file from files in given resource file
 function(create_resources res_file output)
   # Create empty output file

@@ -5,3 +5,5 @@ plot.png
 train.log
 image_provider_copy_1.py
 *pyc
+train.list
+test.list

@@ -16,7 +16,6 @@ import numpy as np
 import sys
 import os
 import PIL.Image as Image
-
 """
 Usage: python process_cifar input_dir output_dir
 """
@@ -30,6 +29,7 @@ def mkdir_not_exist(path):
     if not os.path.exists(path):
         os.mkdir(path)
 
+
 def create_dir_structure(output_dir):
     """
     Create the directory structure for the directory.
@@ -39,8 +39,8 @@ def create_dir_structure(output_dir):
     mkdir_not_exist(os.path.join(output_dir, "train"))
     mkdir_not_exist(os.path.join(output_dir, "test"))
 
-def convert_batch(batch_path, label_set, label_map,
-                  output_dir, data_split):
+
+def convert_batch(batch_path, label_set, label_map, output_dir, data_split):
     """
     Convert CIFAR batch to the structure of Paddle format.
     batch_path: the batch to be converted.
@@ -67,11 +67,23 @@ if __name__ == '__main__':
     output_dir = sys.argv[2]
     num_batch = 5
     create_dir_structure(output_dir)
-    label_map = {0: "airplane", 1: "automobile", 2: "bird", 3: "cat", 4: "deer",
-                 5: "dog", 6: "frog", 7: "horse", 8: "ship", 9: "truck"}
+    label_map = {
+        0: "airplane",
+        1: "automobile",
+        2: "bird",
+        3: "cat",
+        4: "deer",
+        5: "dog",
+        6: "frog",
+        7: "horse",
+        8: "ship",
+        9: "truck"
+    }
     labels = {}
     for i in range(1, num_batch + 1):
-        convert_batch(os.path.join(input_dir, "data_batch_%d" % i), labels,
-                      label_map, output_dir, "train")
-    convert_batch(os.path.join(input_dir, "test_batch"), {},
-                  label_map, output_dir, "test")
+        convert_batch(
+            os.path.join(input_dir, "data_batch_%d" % i), labels, label_map,
+            output_dir, "train")
+    convert_batch(
+        os.path.join(input_dir, "test_batch"), {}, label_map, output_dir,
+        "test")

@@ -46,36 +46,41 @@ def hook(settings, img_size, mean_img_size, num_classes, color, meta, use_jpeg,
     settings.img_mean = image_util.load_meta(settings.meta_path,
                                              settings.mean_img_size,
-                                             settings.img_size,
-                                             settings.color)
+                                             settings.img_size, settings.color)
 
     settings.logger.info('Image size: %s', settings.img_size)
     settings.logger.info('Meta path: %s', settings.meta_path)
     settings.input_types = [
         dense_vector(settings.img_raw_size),  # image feature
-        integer_value(settings.num_classes)]  # labels
+        integer_value(settings.num_classes)
+    ]  # labels
 
     settings.logger.info('DataProvider Initialization finished')
 
 
-@provider(init_hook=hook)
-def processData(settings, file_name):
+@provider(init_hook=hook, min_pool_size=0)
+def processData(settings, file_list):
     """
     The main function for loading data.
     Load the batch, iterate all the images and labels in this batch.
-    file_name: the batch file name.
+    file_list: the batch file list.
     """
-    data = cPickle.load(io.open(file_name, 'rb'))
-    indexes = list(range(len(data['images'])))
-    if settings.is_train:
-        random.shuffle(indexes)
-    for i in indexes:
-        if settings.use_jpeg == 1:
-            img = image_util.decode_jpeg(data['images'][i])
-        else:
-            img = data['images'][i]
-        img_feat = image_util.preprocess_img(img, settings.img_mean,
-                                             settings.img_size, settings.is_train,
-                                             settings.color)
-        label = data['labels'][i]
-        yield img_feat.tolist(), int(label)
+    with open(file_list, 'r') as fdata:
+        lines = [line.strip() for line in fdata]
+        random.shuffle(lines)
+        for file_name in lines:
+            with io.open(file_name.strip(), 'rb') as file:
+                data = cPickle.load(file)
+                indexes = list(range(len(data['images'])))
+                if settings.is_train:
+                    random.shuffle(indexes)
+                for i in indexes:
+                    if settings.use_jpeg == 1:
+                        img = image_util.decode_jpeg(data['images'][i])
+                    else:
+                        img = data['images'][i]
+                    img_feat = image_util.preprocess_img(
+                        img, settings.img_mean, settings.img_size,
+                        settings.is_train, settings.color)
+                    label = data['labels'][i]
+                    yield img_feat.astype('float32'), int(label)
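
The rewritten `processData` now receives the list file itself (one batch path per line) instead of a single batch file, which pairs with the `define_py_data_sources2` change in the trainer config further down. A stripped-down sketch of the pattern (the file layout is assumed, and `pickle` stands in for the demo's Python 2 `cPickle`):

# Minimal sketch of the list-file provider pattern: each line of the list
# names a pickled batch holding parallel 'images' and 'labels' sequences.
import pickle
import random


def iter_samples(list_path, shuffle=True):
    with open(list_path) as f:
        batch_files = [line.strip() for line in f if line.strip()]
    if shuffle:
        random.shuffle(batch_files)  # shuffle at file granularity, as above
    for path in batch_files:
        with open(path, 'rb') as fbatch:
            batch = pickle.load(fbatch)
        for img, label in zip(batch['images'], batch['labels']):
            yield img, int(label)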

@@ -16,17 +16,20 @@ import numpy as np
 from PIL import Image
 from cStringIO import StringIO
 
+
 def resize_image(img, target_size):
     """
     Resize an image so that the shorter edge has length target_size.
     img: the input image to be resized.
     target_size: the target resized image size.
     """
-    percent = (target_size/float(min(img.size[0], img.size[1])))
-    resized_size = int(round(img.size[0] * percent)), int(round(img.size[1] * percent))
+    percent = (target_size / float(min(img.size[0], img.size[1])))
+    resized_size = int(round(img.size[0] * percent)), int(
+        round(img.size[1] * percent))
     img = img.resize(resized_size, Image.ANTIALIAS)
     return img
 
+
 def flip(im):
     """
     Return the flipped image.
@@ -38,6 +41,7 @@ def flip(im):
     else:
         return im[:, ::-1]
 
+
 def crop_img(im, inner_size, color=True, test=True):
     """
     Return cropped image.
@@ -50,20 +54,22 @@ def crop_img(im, inner_size, color=True, test=True):
         If True, crop the center of images.
     """
     if color:
-        height, width = max(inner_size, im.shape[1]), max(inner_size, im.shape[2])
+        height, width = max(inner_size, im.shape[1]), max(inner_size,
+                                                          im.shape[2])
         padded_im = np.zeros((3, height, width))
         startY = (height - im.shape[1]) / 2
        startX = (width - im.shape[2]) / 2
         endY, endX = startY + im.shape[1], startX + im.shape[2]
-        padded_im[:, startY: endY, startX: endX] = im
+        padded_im[:, startY:endY, startX:endX] = im
     else:
         im = im.astype('float32')
-        height, width = max(inner_size, im.shape[0]), max(inner_size, im.shape[1])
+        height, width = max(inner_size, im.shape[0]), max(inner_size,
+                                                          im.shape[1])
         padded_im = np.zeros((height, width))
         startY = (height - im.shape[0]) / 2
         startX = (width - im.shape[1]) / 2
         endY, endX = startY + im.shape[0], startX + im.shape[1]
-        padded_im[startY: endY, startX: endX] = im
+        padded_im[startY:endY, startX:endX] = im
     if test:
         startY = (height - inner_size) / 2
         startX = (width - inner_size) / 2
@@ -72,19 +78,21 @@ def crop_img(im, inner_size, color=True, test=True):
         startX = np.random.randint(0, width - inner_size + 1)
     endY, endX = startY + inner_size, startX + inner_size
     if color:
-        pic = padded_im[:, startY: endY, startX: endX]
+        pic = padded_im[:, startY:endY, startX:endX]
     else:
-        pic = padded_im[startY: endY, startX: endX]
+        pic = padded_im[startY:endY, startX:endX]
     if (not test) and (np.random.randint(2) == 0):
         pic = flip(pic)
     return pic
 
+
 def decode_jpeg(jpeg_string):
     np_array = np.array(Image.open(StringIO(jpeg_string)))
     if len(np_array.shape) == 3:
         np_array = np.transpose(np_array, (2, 0, 1))
     return np_array
 
+
 def preprocess_img(im, img_mean, crop_size, is_train, color=True):
     """
     Does data augmentation for images.
@@ -99,6 +107,7 @@ def preprocess_img(im, img_mean, crop_size, is_train, color=True):
         pic -= img_mean
     return pic.flatten()
 
+
 def load_meta(meta_path, mean_img_size, crop_size, color=True):
     """
     Return the loaded meta file.
@@ -109,17 +118,18 @@ def load_meta(meta_path, mean_img_size, crop_size, color=True):
     mean = np.load(meta_path)['data_mean']
     border = (mean_img_size - crop_size) / 2
     if color:
-        assert(mean_img_size * mean_img_size * 3 == mean.shape[0])
+        assert (mean_img_size * mean_img_size * 3 == mean.shape[0])
         mean = mean.reshape(3, mean_img_size, mean_img_size)
-        mean = mean[:, border: border + crop_size,
-                    border: border + crop_size].astype('float32')
+        mean = mean[:, border:border + crop_size, border:border +
+                    crop_size].astype('float32')
     else:
-        assert(mean_img_size * mean_img_size == mean.shape[0])
+        assert (mean_img_size * mean_img_size == mean.shape[0])
         mean = mean.reshape(mean_img_size, mean_img_size)
-        mean = mean[border: border + crop_size,
-                    border: border + crop_size].astype('float32')
+        mean = mean[border:border + crop_size, border:border +
+                    crop_size].astype('float32')
     return mean
 
+
 def load_image(img_path, is_color=True):
     """
     Load image and return.
@@ -130,6 +140,7 @@ def load_image(img_path, is_color=True):
     img.load()
     return img
 
+
 def oversample(img, crop_dims):
     """
     image : iterable of (H x W x K) ndarrays
@@ -152,50 +163,53 @@ def oversample(img, crop_dims):
         for j in w_indices:
             crops_ix[curr] = (i, j, i + crop_dims[0], j + crop_dims[1])
             curr += 1
-    crops_ix[4] = np.tile(im_center, (1, 2)) + np.concatenate([
-        -crop_dims / 2.0,
-        crop_dims / 2.0
-    ])
+    crops_ix[4] = np.tile(im_center, (1, 2)) + np.concatenate(
+        [-crop_dims / 2.0, crop_dims / 2.0])
     crops_ix = np.tile(crops_ix, (2, 1))
     # Extract crops
-    crops = np.empty((10 * len(img), crop_dims[0], crop_dims[1],
-                      im_shape[-1]), dtype=np.float32)
+    crops = np.empty(
+        (10 * len(img), crop_dims[0], crop_dims[1], im_shape[-1]),
+        dtype=np.float32)
     ix = 0
     for im in img:
         for crop in crops_ix:
             crops[ix] = im[crop[0]:crop[2], crop[1]:crop[3], :]
             ix += 1
-        crops[ix-5:ix] = crops[ix-5:ix, :, ::-1, :]  # flip for mirrors
+        crops[ix - 5:ix] = crops[ix - 5:ix, :, ::-1, :]  # flip for mirrors
     return crops
 
+
 class ImageTransformer:
-    def __init__(self, transpose = None,
-                 channel_swap = None, mean = None, is_color = True):
+    def __init__(self,
+                 transpose=None,
+                 channel_swap=None,
+                 mean=None,
+                 is_color=True):
         self.transpose = transpose
         self.channel_swap = None
         self.mean = None
         self.is_color = is_color
 
     def set_transpose(self, order):
         if self.is_color:
             assert 3 == len(order)
         self.transpose = order
 
     def set_channel_swap(self, order):
         if self.is_color:
             assert 3 == len(order)
         self.channel_swap = order
 
     def set_mean(self, mean):
         # mean value, may be one value per channel
         if mean.ndim == 1:
             mean = mean[:, np.newaxis, np.newaxis]
         else:
             # elementwise mean
             if self.is_color:
                 assert len(mean.shape) == 3
         self.mean = mean
 
     def transformer(self, data):
         if self.transpose is not None:
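
`oversample` above is the classic 10-crop evaluation scheme: four corner crops plus a center crop, then the horizontal mirror of each, giving ten views per image. A toy sketch of that geometry (the array sizes are made up):

# Toy sketch of the 10-crop geometry used by oversample: 4 corner crops +
# 1 center crop, then the horizontal mirror of each (10 views per image).
import numpy as np

im = np.arange(6 * 6 * 3).reshape(6, 6, 3).astype(np.float32)  # H x W x K
ch, cw = 4, 4  # crop dims (made-up numbers)
H, W = im.shape[:2]
corners = [(0, 0), (0, W - cw), (H - ch, 0), (H - ch, W - cw)]
center = ((H - ch) // 2, (W - cw) // 2)

views = []
for y, x in corners + [center]:
    views.append(im[y:y + ch, x:x + cw, :])
views += [v[:, ::-1, :] for v in views]  # horizontal mirrors
print(len(views))  # 10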

@@ -12,7 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-import os,sys
+import os, sys
 import numpy as np
 import logging
 from PIL import Image
@@ -24,9 +24,11 @@ from py_paddle import swig_paddle, DataProviderConverter
 from paddle.trainer.PyDataProvider2 import dense_vector
 from paddle.trainer.config_parser import parse_config
 
-logging.basicConfig(format='[%(levelname)s %(asctime)s %(filename)s:%(lineno)s] %(message)s')
+logging.basicConfig(
+    format='[%(levelname)s %(asctime)s %(filename)s:%(lineno)s] %(message)s')
 logging.getLogger().setLevel(logging.INFO)
 
+
 class ImageClassifier():
     def __init__(self,
                  train_conf,
@@ -58,18 +60,19 @@ class ImageClassifier():
         self.oversample = oversample
         self.is_color = is_color
 
-        self.transformer = image_util.ImageTransformer(is_color = is_color)
-        self.transformer.set_transpose((2,0,1))
+        self.transformer = image_util.ImageTransformer(is_color=is_color)
+        self.transformer.set_transpose((2, 0, 1))
 
         self.mean_file = mean_file
         mean = np.load(self.mean_file)['data_mean']
         mean = mean.reshape(3, self.crop_dims[0], self.crop_dims[1])
-        self.transformer.set_mean(mean) # mean pixel
+        self.transformer.set_mean(mean)  # mean pixel
         gpu = 1 if use_gpu else 0
         conf_args = "is_test=1,use_gpu=%d,is_predict=1" % (gpu)
         conf = parse_config(train_conf, conf_args)
         swig_paddle.initPaddle("--use_gpu=%d" % (gpu))
-        self.network = swig_paddle.GradientMachine.createFromConfigProto(conf.model_config)
+        self.network = swig_paddle.GradientMachine.createFromConfigProto(
+            conf.model_config)
         assert isinstance(self.network, swig_paddle.GradientMachine)
         self.network.loadParameters(self.model_dir)
@@ -90,14 +93,14 @@ class ImageClassifier():
             # image_util.resize_image: short side is self.resize_dim
             image = image_util.resize_image(image, self.resize_dim)
             image = np.array(image)
-            input = np.zeros((1, image.shape[0], image.shape[1], 3),
-                             dtype=np.float32)
+            input = np.zeros(
+                (1, image.shape[0], image.shape[1], 3), dtype=np.float32)
             input[0] = image.astype(np.float32)
             input = image_util.oversample(input, self.crop_dims)
         else:
             image = image.resize(self.crop_dims, Image.ANTIALIAS)
-            input = np.zeros((1, self.crop_dims[0], self.crop_dims[1], 3),
-                             dtype=np.float32)
+            input = np.zeros(
+                (1, self.crop_dims[0], self.crop_dims[1], 3), dtype=np.float32)
             input[0] = np.array(image).astype(np.float32)
 
         data_in = []
@@ -133,22 +136,24 @@ class ImageClassifier():
         lab = np.argsort(-prob)
         logging.info("Label of %s is: %d", image, lab[0])
 
+
 if __name__ == '__main__':
-    image_size=32
-    crop_size=32
-    multi_crop=True
-    config="vgg_16_cifar.py"
-    output_layer="__fc_layer_1__"
-    mean_path="data/cifar-out/batches/batches.meta"
-    model_path=sys.argv[1]
-    image=sys.argv[2]
-    use_gpu=bool(int(sys.argv[3]))
-
-    obj = ImageClassifier(train_conf=config,
-                          model_dir=model_path,
-                          resize_dim=image_size,
-                          crop_dim=crop_size,
-                          mean_file=mean_path,
-                          use_gpu=use_gpu,
-                          oversample=multi_crop)
+    image_size = 32
+    crop_size = 32
+    multi_crop = True
+    config = "vgg_16_cifar.py"
+    output_layer = "__fc_layer_1__"
+    mean_path = "data/cifar-out/batches/batches.meta"
+    model_path = sys.argv[1]
+    image = sys.argv[2]
+    use_gpu = bool(int(sys.argv[3]))
+
+    obj = ImageClassifier(
+        train_conf=config,
+        model_dir=model_path,
+        resize_dim=image_size,
+        crop_dim=crop_size,
+        mean_file=mean_path,
+        use_gpu=use_gpu,
+        oversample=multi_crop)
     obj.predict(image, output_layer)

@@ -19,22 +19,36 @@ from optparse import OptionParser
 def option_parser():
     parser = OptionParser(usage="usage: python preprcoess.py "\
                           "-i data_dir [options]")
-    parser.add_option("-i", "--input", action="store",
-                      dest="input", help="Input data directory.")
-    parser.add_option("-s", "--size", action="store",
-                      dest="size", help="Processed image size.")
-    parser.add_option("-c", "--color", action="store",
-                      dest="color", help="whether to use color images.")
+    parser.add_option(
+        "-i",
+        "--input",
+        action="store",
+        dest="input",
+        help="Input data directory.")
+    parser.add_option(
+        "-s",
+        "--size",
+        action="store",
+        dest="size",
+        help="Processed image size.")
+    parser.add_option(
+        "-c",
+        "--color",
+        action="store",
+        dest="color",
+        help="whether to use color images.")
     return parser.parse_args()
 
+
 if __name__ == '__main__':
     options, args = option_parser()
     data_dir = options.input
     processed_image_size = int(options.size)
     color = options.color == "1"
-    data_creator = ImageClassificationDatasetCreater(data_dir,
-                                                     processed_image_size,
-                                                     color)
+    data_creator = ImageClassificationDatasetCreater(
+        data_dir, processed_image_size, color)
+    data_creator.train_list_name = "train.txt"
+    data_creator.test_list_name = "test.txt"
     data_creator.num_per_batch = 1000
     data_creator.overwrite = True
     data_creator.create_batches()

@@ -17,3 +17,6 @@ set -e
 
 data_dir=./data/cifar-out
 python preprocess.py -i $data_dir -s 32 -c 1
+
+echo "data/cifar-out/batches/train.txt" > train.list
+echo "data/cifar-out/batches/test.txt" > test.list

@@ -18,36 +18,38 @@ is_predict = get_config_arg("is_predict", bool, False)
 ####################Data Configuration ##################
 if not is_predict:
-    data_dir='data/cifar-out/batches/'
-    meta_path=data_dir+'batches.meta'
-    args = {'meta':meta_path,'mean_img_size': 32,
-            'img_size': 32,'num_classes': 10,
-            'use_jpeg': 1,'color': "color"}
-
-    define_py_data_sources2(train_list=data_dir+"train.list",
-                            test_list=data_dir+'test.list',
-                            module='image_provider',
-                            obj='processData',
-                            args=args)
+    data_dir = 'data/cifar-out/batches/'
+    meta_path = data_dir + 'batches.meta'
+    args = {
+        'meta': meta_path,
+        'mean_img_size': 32,
+        'img_size': 32,
+        'num_classes': 10,
+        'use_jpeg': 1,
+        'color': "color"
+    }
+
+    define_py_data_sources2(
+        train_list="train.list",
+        test_list="train.list",
+        module='image_provider',
+        obj='processData',
+        args=args)
 
 ######################Algorithm Configuration #############
 settings(
-    batch_size = 128,
-    learning_rate = 0.1 / 128.0,
-    learning_method = MomentumOptimizer(0.9),
-    regularization = L2Regularization(0.0005 * 128)
-)
+    batch_size=128,
+    learning_rate=0.1 / 128.0,
+    learning_method=MomentumOptimizer(0.9),
+    regularization=L2Regularization(0.0005 * 128))
 
 #######################Network Configuration #############
-data_size=3*32*32
-label_size=10
-img = data_layer(name='image',
-                 size=data_size)
+data_size = 3 * 32 * 32
+label_size = 10
+img = data_layer(name='image', size=data_size)
 # small_vgg is predefined in trainer_config_helpers.networks
-predict = small_vgg(input_image=img,
-                    num_channels=3,
-                    num_classes=label_size)
+predict = small_vgg(input_image=img, num_channels=3, num_classes=label_size)
 
 if not is_predict:
     lbl = data_layer(name="label", size=label_size)

@@ -1,4 +1,3 @@
 This folder contains scripts used in PaddlePaddle introduction.
 - use `bash train.sh` to train a simple linear regression model
 - use `python evaluate_model.py` to read model parameters. You can see that `w` and `b` are very close to [2, 0.3].
-

@@ -15,10 +15,10 @@
 from paddle.trainer.PyDataProvider2 import *
 import random
 
 # define data types of input: 2 real numbers
-@provider(input_types=[dense_vector(1), dense_vector(1)],use_seq=False)
+@provider(input_types=[dense_vector(1), dense_vector(1)], use_seq=False)
 def process(settings, input_file):
     for i in xrange(2000):
         x = random.random()
-        yield [x], [2*x+0.3]
+        yield [x], [2 * x + 0.3]
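
Since the provider labels each uniformly drawn `x` with `2*x + 0.3`, the README's claim above that the trained `w` and `b` land near [2, 0.3] can be sanity-checked in closed form, with no Paddle involved:

# Sanity check, independent of Paddle: data generated as y = 2*x + 0.3
# recovers w ~ 2 and b ~ 0.3 by ordinary least squares.
import numpy as np

rng = np.random.RandomState(0)
x = rng.rand(2000)          # mirrors random.random() in the provider
y = 2 * x + 0.3
A = np.stack([x, np.ones_like(x)], axis=1)  # columns: x, intercept
w, b = np.linalg.lstsq(A, y, rcond=None)[0]
print(w, b)  # ~2.0 ~0.3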

@@ -23,14 +23,17 @@ Usage:
 import numpy as np
 import os
 
+
 def load(file_name):
     with open(file_name, 'rb') as f:
         f.read(16)  # skip header for float type.
         return np.fromfile(f, dtype=np.float32)
 
+
 def main():
     print 'w=%.6f, b=%.6f from pass 29' % (load('output/pass-00029/w'),
                                            load('output/pass-00029/b'))
 
+
 if __name__ == '__main__':
     main()
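
`load()` relies on the layout of Paddle's saved parameter files: a 16-byte header followed by raw float32 values. A round-trip sketch under that assumption (the header bytes are opaque here, so zeros stand in; `w.bin` is a hypothetical name):

# Round-trip sketch of the parameter-file layout assumed by load():
# 16 header bytes (opaque here), then a flat float32 array.
import numpy as np

values = np.array([2.0], dtype=np.float32)
with open("w.bin", "wb") as f:       # hypothetical file name
    f.write(b"\x00" * 16)            # stand-in for the real 16-byte header
    values.tofile(f)

with open("w.bin", "rb") as f:
    f.read(16)                       # skip header, as load() does
    print(np.fromfile(f, dtype=np.float32))  # [2.]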

@@ -16,9 +16,14 @@ from paddle.trainer_config_helpers import *
 
 # 1. read data. Suppose you saved above python code as dataprovider.py
 data_file = 'empty.list'
-with open(data_file, 'w') as f: f.writelines(' ')
-define_py_data_sources2(train_list=data_file, test_list=None,
-                        module='dataprovider', obj='process',args={})
+with open(data_file, 'w') as f:
+    f.writelines(' ')
+define_py_data_sources2(
+    train_list=data_file,
+    test_list=None,
+    module='dataprovider',
+    obj='process',
+    args={})
 
 # 2. learning algorithm
 settings(batch_size=12, learning_rate=1e-3, learning_method=MomentumOptimizer())
@@ -26,7 +31,11 @@ settings(batch_size=12, learning_rate=1e-3, learning_method=MomentumOptimizer())
 
 # 3. Network configuration
 x = data_layer(name='x', size=1)
 y = data_layer(name='y', size=1)
-y_predict = fc_layer(input=x, param_attr=ParamAttr(name='w'), size=1, act=LinearActivation(), bias_attr=ParamAttr(name='b'))
+y_predict = fc_layer(
+    input=x,
+    param_attr=ParamAttr(name='w'),
+    size=1,
+    act=LinearActivation(),
+    bias_attr=ParamAttr(name='b'))
 cost = regression_cost(input=y_predict, label=y)
 outputs(cost)

@@ -13,9 +13,9 @@
 # limitations under the License.
 
 o = open("./" + "train.list", "w")
-o.write("./data/raw_data/train" +"\n")
+o.write("./data/raw_data/train" + "\n")
 o.close()
 o = open("./" + "test.list", "w")
-o.write("./data/raw_data/t10k" +"\n")
+o.write("./data/raw_data/t10k" + "\n")
 o.close()

@@ -19,4 +19,3 @@ done
 cd $DIR
 rm -f *.list
 python generate_list.py
-

Some files were not shown because too many files have changed in this diff.