From fe016d321c4cc05db97e8c18db576a7e56d31cb4 Mon Sep 17 00:00:00 2001
From: jonyguo
Date: Thu, 27 Aug 2020 21:32:31 +0800
Subject: [PATCH] update tiny bert script and readme

---
 model_zoo/official/nlp/tinybert/README.md          | 14 ++++++++------
 .../official/nlp/tinybert/run_general_distill.py   |  3 ++-
 .../official/nlp/tinybert/run_task_distill.py      |  3 ++-
 .../tinybert/scripts/run_distributed_gd_ascend.sh  |  3 ++-
 .../nlp/tinybert/scripts/run_distributed_gd_gpu.sh |  1 +
 .../nlp/tinybert/scripts/run_standalone_td.sh      |  3 ++-
 6 files changed, 17 insertions(+), 10 deletions(-)

diff --git a/model_zoo/official/nlp/tinybert/README.md b/model_zoo/official/nlp/tinybert/README.md
index 66950d4b54..a17bef5999 100644
--- a/model_zoo/official/nlp/tinybert/README.md
+++ b/model_zoo/official/nlp/tinybert/README.md
@@ -44,12 +44,12 @@ After installing MindSpore via the official website, you can start general disti
 # run standalone general distill example
 bash scripts/run_standalone_gd.sh
 
-Before running the shell script, please set the `load_teacher_ckpt_path`, `data_dir` and `schema_dir` in the run_standalone_gd.sh file first. If running on GPU, please set the `device_target=GPU`.
+Before running the shell script, please set the `load_teacher_ckpt_path`, `data_dir`, `schema_dir` and `dataset_type` in the run_standalone_gd.sh file first. If running on GPU, please set the `device_target=GPU`.
 
 # For Ascend device, run distributed general distill example
 bash scripts/run_distributed_gd_ascend.sh 8 1 /path/hccl.json
 
-Before running the shell script, please set the `load_teacher_ckpt_path`, `data_dir` and `schema_dir` in the run_distributed_gd_ascend.sh file first.
+Before running the shell script, please set the `load_teacher_ckpt_path`, `data_dir`, `schema_dir` and `dataset_type` in the run_distributed_gd_ascend.sh file first.
 
 # For GPU device, run distributed general distill example
 bash scripts/run_distributed_gd_gpu.sh 8 1 /path/data/ /path/schema.json /path/teacher.ckpt
@@ -57,7 +57,7 @@ bash scripts/run_distributed_gd_gpu.sh 8 1 /path/data/ /path/schema.json /path/t
 # run task distill and evaluation example
 bash scripts/run_standalone_td.sh
 
-Before running the shell script, please set the `task_name`, `load_teacher_ckpt_path`, `load_gd_ckpt_path`, `train_data_dir`, `eval_data_dir` and `schema_dir` in the run_standalone_td.sh file first.
+Before running the shell script, please set the `task_name`, `load_teacher_ckpt_path`, `load_gd_ckpt_path`, `train_data_dir`, `eval_data_dir`, `schema_dir` and `dataset_type` in the run_standalone_td.sh file first.
 If running on GPU, please set the `device_target=GPU`.
 ```
@@ -101,7 +101,7 @@ usage: run_general_distill.py [--distribute DISTRIBUTE] [--epoch_size N] [----
                               [--save_ckpt_path SAVE_CKPT_PATH]
                               [--load_teacher_ckpt_path LOAD_TEACHER_CKPT_PATH]
                               [--save_checkpoint_step N] [--max_ckpt_num N]
-                              [--data_dir DATA_DIR] [--schema_dir SCHEMA_DIR] [train_steps N]
+                              [--data_dir DATA_DIR] [--schema_dir SCHEMA_DIR] [--dataset_type DATASET_TYPE] [train_steps N]
 
 options:
     --device_target            device where the code will be implemented: "Ascend" | "GPU", default is "Ascend"
@@ -118,6 +118,7 @@ options:
     --load_teacher_ckpt_path   path to load teacher checkpoint files: PATH, default is ""
     --data_dir                 path to dataset directory: PATH, default is ""
     --schema_dir               path to schema.json file, PATH, default is ""
+    --dataset_type             the dataset type which can be tfrecord/mindrecord, default is tfrecord
 ```
 
 ### Task Distill
@@ -132,7 +133,7 @@ usage: run_general_task.py [--device_target DEVICE_TARGET] [--do_train DO_TRAIN
                            [--load_td1_ckpt_path LOAD_TD1_CKPT_PATH]
                            [--train_data_dir TRAIN_DATA_DIR]
                            [--eval_data_dir EVAL_DATA_DIR]
-                           [--task_name TASK_NAME] [--schema_dir SCHEMA_DIR]
+                           [--task_name TASK_NAME] [--schema_dir SCHEMA_DIR] [--dataset_type DATASET_TYPE]
 
 options:
     --device_target            device where the code will be implemented: "Ascend" | "GPU", default is "Ascend"
@@ -153,6 +154,7 @@ options:
     --eval_data_dir            path to eval dataset directory: PATH, default is ""
     --task_name                classification task: "SST-2" | "QNLI" | "MNLI", default is ""
     --schema_dir               path to schema.json file, PATH, default is ""
+    --dataset_type             the dataset type which can be tfrecord/mindrecord, default is tfrecord
 ```
 
 ## Options and Parameters
@@ -344,4 +346,4 @@ In run_general_distill.py, we set the random seed to make sure distribute traini
 
 # [ModelZoo Homepage](#contents)
 
-Please check the official [homepage](https://gitee.com/mindspore/mindspore/tree/master/model_zoo).
\ No newline at end of file
+Please check the official [homepage](https://gitee.com/mindspore/mindspore/tree/master/model_zoo).
diff --git a/model_zoo/official/nlp/tinybert/run_general_distill.py b/model_zoo/official/nlp/tinybert/run_general_distill.py
index dd4b36cd09..ff771428db 100644
--- a/model_zoo/official/nlp/tinybert/run_general_distill.py
+++ b/model_zoo/official/nlp/tinybert/run_general_distill.py
@@ -55,7 +55,8 @@ def run_general_distill():
     parser.add_argument("--load_teacher_ckpt_path", type=str, default="", help="Load checkpoint file path")
     parser.add_argument("--data_dir", type=str, default="", help="Data path, it is better to use absolute path")
     parser.add_argument("--schema_dir", type=str, default="", help="Schema path, it is better to use absolute path")
-    parser.add_argument("--dataset_type", type=str, default="tfrecord", help="dataset type, default is tfrecord")
+    parser.add_argument("--dataset_type", type=str, default="tfrecord",
+                        help="dataset type tfrecord/mindrecord, default is tfrecord")
     args_opt = parser.parse_args()
 
     context.set_context(mode=context.GRAPH_MODE, device_target=args_opt.device_target, device_id=args_opt.device_id)
diff --git a/model_zoo/official/nlp/tinybert/run_task_distill.py b/model_zoo/official/nlp/tinybert/run_task_distill.py
index bc3266d265..f6a504a1a3 100644
--- a/model_zoo/official/nlp/tinybert/run_task_distill.py
+++ b/model_zoo/official/nlp/tinybert/run_task_distill.py
@@ -68,7 +68,8 @@ def parse_args():
     parser.add_argument("--schema_dir", type=str, default="", help="Schema path, it is better to use absolute path")
     parser.add_argument("--task_name", type=str, default="", choices=["SST-2", "QNLI", "MNLI"],
                         help="The name of the task to train.")
-    parser.add_argument("--dataset_type", type=str, default="tfrecord", help="dataset type, default is tfrecord")
+    parser.add_argument("--dataset_type", type=str, default="tfrecord",
+                        help="dataset type tfrecord/mindrecord, default is tfrecord")
     args = parser.parse_args()
     return args
 
diff --git a/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_ascend.sh b/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_ascend.sh
index 79762a7bca..3b94ccab9b 100644
--- a/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_ascend.sh
+++ b/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_ascend.sh
@@ -65,6 +65,7 @@ do
         --max_ckpt_num=1 \
         --load_teacher_ckpt_path="" \
         --data_dir="" \
-        --schema_dir="" > log.txt 2>&1 &
+        --schema_dir="" \
+        --dataset_type="tfrecord" > log.txt 2>&1 &
     cd ../
 done
diff --git a/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_gpu.sh b/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_gpu.sh
index 33c6bd2036..ab7d2046ef 100644
--- a/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_gpu.sh
+++ b/model_zoo/official/nlp/tinybert/scripts/run_distributed_gd_gpu.sh
@@ -37,5 +37,6 @@ mpirun --allow-run-as-root -n $RANK_SIZE \
     --save_ckpt_path="" \
     --data_dir=$DATA_DIR \
     --schema_dir=$SCHEMA_DIR \
+    --dataset_type="tfrecord" \
     --enable_data_sink=False \
     --load_teacher_ckpt_path=$TEACHER_CKPT_PATH > log.txt 2>&1 &
diff --git a/model_zoo/official/nlp/tinybert/scripts/run_standalone_td.sh b/model_zoo/official/nlp/tinybert/scripts/run_standalone_td.sh
index a8d0d4fc51..5c52c6e978 100644
--- a/model_zoo/official/nlp/tinybert/scripts/run_standalone_td.sh
+++ b/model_zoo/official/nlp/tinybert/scripts/run_standalone_td.sh
@@ -43,5 +43,6 @@ python ${PROJECT_DIR}/../run_task_distill.py \
     --load_td1_ckpt_path="" \
     --train_data_dir="" \
     --eval_data_dir="" \
-    --schema_dir="" > log.txt 2>&1 &
+    --schema_dir="" \
+    --dataset_type="tfrecord" > log.txt 2>&1 &
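The patch threads `--dataset_type` from the shell scripts into the two Python entry points, but the flag only takes effect where the dataset is actually constructed. Below is a minimal sketch of that dispatch using MindSpore's dataset API, modeled on the repository's `create_tinybert_dataset` helper; the exact signature, column list, and defaults here are illustrative assumptions, not lines from the patch:

```python
import mindspore.dataset as ds

def create_tinybert_dataset(data_files, schema_file=None, batch_size=32,
                            rank_size=1, rank_id=0, dataset_type="tfrecord"):
    """Build the distillation dataset from TFRecord or MindRecord files.

    Sketch only: argument names and defaults are assumptions for illustration.
    """
    columns = ["input_ids", "input_mask", "segment_ids"]
    if dataset_type == "tfrecord":
        # TFRecord files are read against the schema.json description;
        # num_shards/shard_id split the data across devices.
        dataset = ds.TFRecordDataset(data_files, schema_file,
                                     columns_list=columns,
                                     num_shards=rank_size, shard_id=rank_id,
                                     shard_equal_rows=True)
    elif dataset_type == "mindrecord":
        # MindRecord embeds its schema in the data files themselves,
        # so no schema.json is needed on this path.
        dataset = ds.MindDataset(data_files, columns_list=columns,
                                 num_shards=rank_size, shard_id=rank_id)
    else:
        raise ValueError("dataset_type should be tfrecord or mindrecord")
    return dataset.batch(batch_size, drop_remainder=True)
```

With a dispatch like this in place, switching any of the scripts above to MindRecord data should only require changing `--dataset_type="tfrecord"` to `--dataset_type="mindrecord"` and pointing the data path at MindRecord files; `schema_dir` is consumed only on the tfrecord path.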