Skip to content

Commit 7d2f50e

Browse files
authored
Refine cpp demo flags vocab_dir to vocab_file (#1150)
1 parent 0f2d8a6 commit 7d2f50e

File tree

7 files changed

+36
-36
lines changed

7 files changed

+36
-36
lines changed

docs/advanced_guide/fastertransformer.rst

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -292,7 +292,7 @@ PaddleNLP 准备
292292
.. code-block::
293293
294294
cd bin/
295-
./transformer_e2e -batch_size <batch_size> -gpu_id <gpu_id> -model_dir <model_directory> -vocab_dir <dict_directory> -data_dir <input_data>
295+
./transformer_e2e -batch_size <batch_size> -gpu_id <gpu_id> -model_dir <model_directory> -vocab_file <dict_file> -data_file <input_data>
296296
297297
举例说明:
298298

@@ -301,7 +301,7 @@ PaddleNLP 准备
301301
cd bin/
302302
# 执行 decoding_gemm 目的是基于当前环境、配置,提前确定一个性能最佳的矩阵乘算法,不是必要的步骤
303303
../third-party/build/fastertransformer/bin/decoding_gemm 8 5 8 64 38512 256 512 0
304-
./transformer_e2e -batch_size 8 -gpu_id 0 -model_dir ./infer_model/ -vocab_dir DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/vocab_all.bpe.33708 -data_dir DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/newstest2014.tok.bpe.33708.en
304+
./transformer_e2e -batch_size 8 -gpu_id 0 -model_dir ./infer_model/ -vocab_file DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/vocab_all.bpe.33708 -data_file DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/newstest2014.tok.bpe.33708.en
305305
306306
其中:
307307

@@ -344,4 +344,4 @@ PaddleNLP 准备
344344
.. code-block::
345345
346346
cd bin/
347-
./gpt -batch_size 1 -gpu_id 0 -model_dir path/to/model -vocab_dir path/to/vocab -start_token "<|endoftext|>" -end_token "<|endoftext|>"
347+
./gpt -batch_size 1 -gpu_id 0 -model_dir path/to/model -vocab_file path/to/vocab -start_token "<|endoftext|>" -end_token "<|endoftext|>"

examples/machine_translation/transformer/deploy/cpp/README.md

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -62,7 +62,7 @@ bash run.sh
6262

6363
``` sh
6464
export CUDA_VISIBLE_DEVICES=0
65-
./build/bin/transformer_e2e -batch_size 8 -device gpu -gpu_id 0 -model_dir ./infer_model/ -vocab_dir /root/.paddlenlp/datasets/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/vocab_all.bpe.33708 -data_dir /root/.paddlenlp/datasets/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/newstest2014.tok.bpe.33708.en
65+
./build/bin/transformer_e2e -batch_size 8 -device gpu -gpu_id 0 -model_dir ./infer_model/ -vocab_file /root/.paddlenlp/datasets/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/vocab_all.bpe.33708 -data_file /root/.paddlenlp/datasets/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/newstest2014.tok.bpe.33708.en
6666
```
6767

6868
各个参数解释如下:
@@ -72,8 +72,8 @@ export CUDA_VISIBLE_DEVICES=0
7272
* `-use_mkl`: 是否使用 mkl,设置代表使用 mkl,不设置则不使用 mkl。仅在使用 cpu 进行预测的时候有效。
7373
* `-threads`: 仅在使用 mkl 的时候起效,用于指定计算 math 库时的线程数。
7474
* `-model_dir`: 导出的模型的位置。
75-
* `-vocab_dir`: 词表的位置
76-
* `-data_dir`: 推理用的数据的位置。
75+
* `-vocab_file`: 词表文件的位置。
76+
* `-data_file`: 推理用的数据的位置。
7777

7878
英德翻译的结果会保存到 `predict.txt` 文件中。
7979

examples/machine_translation/transformer/deploy/cpp/run_impl.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -30,4 +30,4 @@ cmake .. -DPADDLE_LIB=${LIB_DIR} \
3030

3131
make -j
3232

33-
./${DEMO_NAME} -batch_size 8 -device ${DEVICE} -gpu_id 0 -model_dir ${MODEL_FILE_DIR} -vocab_dir ${VOCAB_DIR} -data_dir ${DATA_DIR}
33+
./${DEMO_NAME} -batch_size 8 -device ${DEVICE} -gpu_id 0 -model_dir ${MODEL_FILE_DIR} -vocab_file ${VOCAB_DIR} -data_file ${DATA_DIR}

examples/machine_translation/transformer/deploy/cpp/transformer_e2e.cc

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -30,18 +30,18 @@ DEFINE_int32(threads,
3030
DEFINE_string(model_dir,
3131
"./infer_model/",
3232
"The directory to the inference model. ");
33-
DEFINE_string(vocab_dir,
33+
DEFINE_string(vocab_file,
3434
"./vocab_all.bpe.33708",
35-
"The directory to the vocabulary file. ");
36-
DEFINE_string(data_dir,
35+
"The path to the vocabulary file. ");
36+
DEFINE_string(data_file,
3737
"./newstest2014.tok.bpe.33708.en",
38-
"The directory to the input data. ");
38+
"The path to the input data file. ");
3939

4040
using namespace paddle_infer;
4141

4242
std::string model_dir = "";
43-
std::string vocab_dir = "";
44-
std::string data_dir = "";
43+
std::string vocab_file = "";
44+
std::string data_file = "";
4545

4646
const int EOS_IDX = 1;
4747
const int PAD_IDX = 0;
@@ -140,7 +140,7 @@ class DataReader {
140140
}
141141

142142
bool GetWordDict() {
143-
std::ifstream fin(vocab_dir);
143+
std::ifstream fin(vocab_file);
144144
std::string line;
145145
int k = 0;
146146
while (std::getline(fin, line)) {
@@ -239,7 +239,7 @@ void Main(
239239
// can turn off the IR optimization for same results as following:
240240
// config.SwitchIrOptim(false);
241241
auto predictor = CreatePredictor(config);
242-
DataReader reader(data_dir);
242+
DataReader reader(data_file);
243243
reader.GetWordDict();
244244

245245
double whole_time = 0;
@@ -281,8 +281,8 @@ int main(int argc, char** argv) {
281281
gpu_id = FLAGS_gpu_id;
282282

283283
model_dir = FLAGS_model_dir;
284-
vocab_dir = FLAGS_vocab_dir;
285-
data_dir = FLAGS_data_dir;
284+
vocab_file = FLAGS_vocab_file;
285+
data_file = FLAGS_data_file;
286286

287287
paddle::inference::Main(
288288
batch_size, FLAGS_device, gpu_id, FLAGS_use_mkl, FLAGS_threads);

paddlenlp/ops/README.md

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -277,7 +277,7 @@ cd ../
277277

278278
``` sh
279279
cd bin/
280-
./transformer_e2e -batch_size <batch_size> -gpu_id <gpu_id> -model_dir <model_directory> -vocab_dir <dict_directory> -data_dir <input_data>
280+
./transformer_e2e -batch_size <batch_size> -gpu_id <gpu_id> -model_dir <model_directory> -vocab_file <dict_file> -data_file <input_data>
281281
```
282282

283283
举例说明:
@@ -286,7 +286,7 @@ cd bin/
286286
cd bin/
287287
# 执行 decoding_gemm 目的是基于当前环境、配置,提前确定一个性能最佳的矩阵乘算法,不是必要的步骤
288288
../third-party/build/fastertransformer/bin/decoding_gemm 8 5 8 64 38512 256 512 0
289-
./transformer_e2e -batch_size 8 -gpu_id 0 -model_dir ./infer_model/ -vocab_dir DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/vocab_all.bpe.33708 -data_dir DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/newstest2014.tok.bpe.33708.en
289+
./transformer_e2e -batch_size 8 -gpu_id 0 -model_dir ./infer_model/ -vocab_file DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/vocab_all.bpe.33708 -data_file DATA_HOME/WMT14ende/WMT14.en-de/wmt14_ende_data_bpe/newstest2014.tok.bpe.33708.en
290290
```
291291

292292
其中:
@@ -326,5 +326,5 @@ python ./faster_transformer/sample/gpt_export_model_sample.py --model_name_or_pa
326326

327327
``` sh
328328
cd bin/
329-
./gpt -batch_size 1 -gpu_id 0 -model_dir path/to/model -vocab_dir path/to/vocab -start_token "<|endoftext|>" -end_token "<|endoftext|>"
329+
./gpt -batch_size 1 -gpu_id 0 -model_dir path/to/model -vocab_file path/to/vocab -start_token "<|endoftext|>" -end_token "<|endoftext|>"
330330
```

paddlenlp/ops/faster_transformer/src/demo/gpt.cc

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -29,16 +29,16 @@ DEFINE_int32(gpu_id, 0, "The gpu id to do inference. ");
2929
DEFINE_string(model_dir,
3030
"./infer_model/",
3131
"The directory to the inference model. ");
32-
DEFINE_string(vocab_dir,
33-
"./infer_model/",
34-
"The directory to the vocabulary file. ");
32+
DEFINE_string(vocab_file,
33+
"./infer_model/vocab.txt",
34+
"The path to the vocabulary file. ");
3535
DEFINE_string(start_token, "<|endoftext|>", "The start token of GPT.");
3636
DEFINE_string(end_token, "<|endoftext|>", "The end token of GPT.");
3737

3838
using namespace paddle_infer;
3939

4040
std::string model_dir = "";
41-
std::string vocab_dir = "";
41+
std::string vocab_file = "";
4242

4343
const int BOS_IDX = 50256;
4444
const int EOS_IDX = 50256;
@@ -168,7 +168,7 @@ class DataReader {
168168
}
169169

170170
bool GetWordDict() {
171-
std::ifstream fin(vocab_dir);
171+
std::ifstream fin(vocab_file);
172172
std::string line;
173173
int k = 0;
174174
while (std::getline(fin, line)) {
@@ -296,7 +296,7 @@ int main(int argc, char** argv) {
296296
gpu_id = FLAGS_gpu_id;
297297

298298
model_dir = FLAGS_model_dir;
299-
vocab_dir = FLAGS_vocab_dir;
299+
vocab_file = FLAGS_vocab_file;
300300

301301
paddle::inference::Main(batch_size,
302302
gpu_id,

paddlenlp/ops/faster_transformer/src/demo/transformer_e2e.cc

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -38,16 +38,16 @@ DEFINE_int32(gpu_id, 0, "The gpu id to do inference. ");
3838
DEFINE_string(model_dir,
3939
"./infer_model/",
4040
"The directory to the inference model. ");
41-
DEFINE_string(vocab_dir,
41+
DEFINE_string(vocab_file,
4242
"./vocab_all.bpe.33708",
43-
"The directory to the vocabulary file. ");
44-
DEFINE_string(data_dir,
43+
"The path to the vocabulary file. ");
44+
DEFINE_string(data_file,
4545
"./newstest2014.tok.bpe.33708.en",
46-
"The directory to the input data. ");
46+
"The path to the input data file. ");
4747

4848
std::string model_dir = "";
49-
std::string vocab_dir = "";
50-
std::string data_dir = "";
49+
std::string vocab_file = "";
50+
std::string data_file = "";
5151

5252
const int EOS_IDX = 1;
5353
const int PAD_IDX = 0;
@@ -145,7 +145,7 @@ class DataReader {
145145
}
146146

147147
bool GetWordDict() {
148-
std::ifstream fin(vocab_dir);
148+
std::ifstream fin(vocab_file);
149149
std::string line;
150150
int k = 0;
151151
while (std::getline(fin, line)) {
@@ -219,7 +219,7 @@ void Main(int batch_size, int gpu_id) {
219219
// can turn off the IR optimization for same results as following:
220220
// config.SwitchIrOptim(false);
221221
auto predictor = CreatePredictor(config);
222-
DataReader reader(data_dir);
222+
DataReader reader(data_file);
223223
reader.GetWordDict();
224224

225225
double whole_time = 0;
@@ -263,8 +263,8 @@ int main(int argc, char** argv) {
263263
gpu_id = FLAGS_gpu_id;
264264

265265
model_dir = FLAGS_model_dir;
266-
vocab_dir = FLAGS_vocab_dir;
267-
data_dir = FLAGS_data_dir;
266+
vocab_file = FLAGS_vocab_file;
267+
data_file = FLAGS_data_file;
268268

269269
paddle::inference::Main(batch_size, gpu_id);
270270

0 commit comments

Comments
 (0)