From e222bc9e64b603e351d055a7592db0cd3cc3bb6b Mon Sep 17 00:00:00 2001 From: LDOUBLEV Date: Tue, 7 Jul 2020 02:35:17 +0000 Subject: [PATCH 1/4] set evaluation interval --- doc/doc_ch/config.md | 2 +- doc/doc_en/config_en.md | 2 +- tools/program.py | 18 ++++++++++++++++-- 3 files changed, 18 insertions(+), 4 deletions(-) diff --git a/doc/doc_ch/config.md b/doc/doc_ch/config.md index ae16263e..56e5c7f5 100644 --- a/doc/doc_ch/config.md +++ b/doc/doc_ch/config.md @@ -22,7 +22,7 @@ | print_batch_step | 设置打印log间隔 | 10 | \ | | save_model_dir | 设置模型保存路径 | output/{算法名称} | \ | | save_epoch_step | 设置模型保存间隔 | 3 | \ | -| eval_batch_step | 设置模型评估间隔 | 2000 | \ | +| eval_batch_step | 设置模型评估间隔 | 2000 或 [1000, 2000] | 2000 表示每2000次迭代评估一次,[1000, 2000]表示从1000次迭代开始,每2000次评估一次 | |train_batch_size_per_card | 设置训练时单卡batch size | 256 | \ | | test_batch_size_per_card | 设置评估时单卡batch size | 256 | \ | | image_shape | 设置输入图片尺寸 | [3, 32, 100] | \ | diff --git a/doc/doc_en/config_en.md b/doc/doc_en/config_en.md index b9ad0394..932de26c 100644 --- a/doc/doc_en/config_en.md +++ b/doc/doc_en/config_en.md @@ -22,7 +22,7 @@ Take `rec_chinese_lite_train.yml` as an example | print_batch_step | Set print log interval | 10 | \ | | save_model_dir | Set model save path | output/{model_name} | \ | | save_epoch_step | Set model save interval | 3 | \ | -| eval_batch_step | Set the model evaluation interval | 2000 | \ | +| eval_batch_step | Set the model evaluation interval |2000 or [1000, 2000] |runing evaluation every 2000 iters or evaluation is run every 2000 iterations after the 1000th iteration | |train_batch_size_per_card | Set the batch size during training | 256 | \ | | test_batch_size_per_card | Set the batch size during testing | 256 | \ | | image_shape | Set input image size | [3, 32, 100] | \ | diff --git a/tools/program.py b/tools/program.py index 3c71065a..57447caa 100755 --- a/tools/program.py +++ b/tools/program.py @@ -219,6 +219,13 @@ def train_eval_det_run(config, exe, train_info_dict, eval_info_dict): epoch_num = config['Global']['epoch_num'] print_batch_step = config['Global']['print_batch_step'] eval_batch_step = config['Global']['eval_batch_step'] + start_eval_step = 0 + if type(eval_batch_step) == list and len(eval_batch_step) >= 2: + start_eval_step = eval_batch_step[0] + eval_batch_step = eval_batch_step[1] + logger.info( + "During the training process, after the {}th iteration, an evaluation is run every {} iterations". + format(start_eval_step, eval_batch_step)) save_epoch_step = config['Global']['save_epoch_step'] save_model_dir = config['Global']['save_model_dir'] if not os.path.exists(save_model_dir): @@ -246,7 +253,7 @@ def train_eval_det_run(config, exe, train_info_dict, eval_info_dict): t2 = time.time() train_batch_elapse = t2 - t1 train_stats.update(stats) - if train_batch_id > 0 and train_batch_id \ + if train_batch_id > start_eval_step and train_batch_id \ % print_batch_step == 0: logs = train_stats.log() strs = 'epoch: {}, iter: {}, {}, time: {:.3f}'.format( @@ -286,6 +293,13 @@ def train_eval_rec_run(config, exe, train_info_dict, eval_info_dict): epoch_num = config['Global']['epoch_num'] print_batch_step = config['Global']['print_batch_step'] eval_batch_step = config['Global']['eval_batch_step'] + start_eval_step = 0 + if type(eval_batch_step) == list and len(eval_batch_step) >= 2: + start_eval_step = eval_batch_step[0] + eval_batch_step = eval_batch_step[1] + logger.info( + "During the training process, after the {}th iteration, an evaluation is run every {} iterations". + format(start_eval_step, eval_batch_step)) save_epoch_step = config['Global']['save_epoch_step'] save_model_dir = config['Global']['save_model_dir'] if not os.path.exists(save_model_dir): @@ -324,7 +338,7 @@ def train_eval_rec_run(config, exe, train_info_dict, eval_info_dict): train_batch_elapse = t2 - t1 stats = {'loss': loss, 'acc': acc} train_stats.update(stats) - if train_batch_id > 0 and train_batch_id \ + if train_batch_id > start_eval_step and train_batch_id \ % print_batch_step == 0: logs = train_stats.log() strs = 'epoch: {}, iter: {}, lr: {:.6f}, {}, time: {:.3f}'.format( From f5e0e9d050dda87690cfcd3c9b976bcc4e72a90c Mon Sep 17 00:00:00 2001 From: LDOUBLEV Date: Tue, 7 Jul 2020 02:51:50 +0000 Subject: [PATCH 2/4] update --- tools/program.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tools/program.py b/tools/program.py index 57447caa..870d2700 100755 --- a/tools/program.py +++ b/tools/program.py @@ -253,7 +253,7 @@ def train_eval_det_run(config, exe, train_info_dict, eval_info_dict): t2 = time.time() train_batch_elapse = t2 - t1 train_stats.update(stats) - if train_batch_id > start_eval_step and train_batch_id \ + if train_batch_id > start_eval_step and (train_batch_id -start_eval_step) \ % print_batch_step == 0: logs = train_stats.log() strs = 'epoch: {}, iter: {}, {}, time: {:.3f}'.format( @@ -338,7 +338,7 @@ def train_eval_rec_run(config, exe, train_info_dict, eval_info_dict): train_batch_elapse = t2 - t1 stats = {'loss': loss, 'acc': acc} train_stats.update(stats) - if train_batch_id > start_eval_step and train_batch_id \ + if train_batch_id > start_eval_step and (train_batch_id - start_eval_step) \ % print_batch_step == 0: logs = train_stats.log() strs = 'epoch: {}, iter: {}, lr: {:.6f}, {}, time: {:.3f}'.format( From 738d787b019ea6723869239fee2ac9980799bbe0 Mon Sep 17 00:00:00 2001 From: LDOUBLEV Date: Tue, 7 Jul 2020 06:46:42 +0000 Subject: [PATCH 3/4] fix doc and modify config --- README.md | 1 + README_en.md | 3 +++ configs/det/det_mv3_db.yml | 5 +++-- configs/det/det_mv3_east.yml | 2 +- configs/det/det_r50_vd_db.yml | 2 +- configs/det/det_r50_vd_east.yml | 2 +- 6 files changed, 10 insertions(+), 5 deletions(-) diff --git a/README.md b/README.md index f4556441..6c85bbac 100644 --- a/README.md +++ b/README.md @@ -92,6 +92,7 @@ python3 tools/infer/predict_system.py --image_dir="./doc/imgs/11.jpg" --det_mode - [文本检测模型训练/评估/预测](./doc/doc_ch/detection.md) - [文本识别模型训练/评估/预测](./doc/doc_ch/recognition.md) - [基于预测引擎推理](./doc/doc_ch/inference.md) +- [yml配置文件参数介绍](./doc/doc_ch/config_ch.md) - [数据集](./doc/doc_ch/datasets.md) - [FAQ](#FAQ) - [联系我们](#欢迎加入PaddleOCR技术交流群) diff --git a/README_en.md b/README_en.md index 610c25b7..277f0d9f 100644 --- a/README_en.md +++ b/README_en.md @@ -92,7 +92,9 @@ For more text detection and recognition models, please refer to the document [In - [Text detection model training/evaluation/prediction](./doc/doc_en/detection_en.md) - [Text recognition model training/evaluation/prediction](./doc/doc_en/recognition_en.md) - [Inference](./doc/doc_en/inference_en.md) +- [Introduction of yml file](./doc/doc_en/config_en.md) - [Dataset](./doc/doc_en/datasets_en.md) +- [FAQ]((#FAQ) ## TEXT DETECTION ALGORITHM @@ -170,6 +172,7 @@ Please refer to the document for training guide and use of PaddleOCR text recogn ![](doc/imgs_results/chinese_db_crnn_server/2.jpg) ![](doc/imgs_results/chinese_db_crnn_server/8.jpg) + ## FAQ 1. Error when using attention-based recognition model: KeyError: 'predict' diff --git a/configs/det/det_mv3_db.yml b/configs/det/det_mv3_db.yml index 8efa66a9..f02c61c9 100755 --- a/configs/det/det_mv3_db.yml +++ b/configs/det/det_mv3_db.yml @@ -6,7 +6,8 @@ Global: print_batch_step: 2 save_model_dir: ./output/det_db/ save_epoch_step: 200 - eval_batch_step: 5000 + # evaluation is run every 2000 iterations after the 5000th iteration + eval_batch_step: [5000, 5000] train_batch_size_per_card: 16 test_batch_size_per_card: 16 image_shape: [3, 640, 640] @@ -50,4 +51,4 @@ PostProcess: thresh: 0.3 box_thresh: 0.7 max_candidates: 1000 - unclip_ratio: 2.0 \ No newline at end of file + unclip_ratio: 2.0 diff --git a/configs/det/det_mv3_east.yml b/configs/det/det_mv3_east.yml index b6f37256..67b82fff 100755 --- a/configs/det/det_mv3_east.yml +++ b/configs/det/det_mv3_east.yml @@ -6,7 +6,7 @@ Global: print_batch_step: 5 save_model_dir: ./output/det_east/ save_epoch_step: 200 - eval_batch_step: 5000 + eval_batch_step: [5000, 5000] train_batch_size_per_card: 16 test_batch_size_per_card: 16 image_shape: [3, 512, 512] diff --git a/configs/det/det_r50_vd_db.yml b/configs/det/det_r50_vd_db.yml index 6e3b3b9e..9a3b77e7 100755 --- a/configs/det/det_r50_vd_db.yml +++ b/configs/det/det_r50_vd_db.yml @@ -6,7 +6,7 @@ Global: print_batch_step: 2 save_model_dir: ./output/det_db/ save_epoch_step: 200 - eval_batch_step: 5000 + eval_batch_step: [5000, 5000] train_batch_size_per_card: 8 test_batch_size_per_card: 16 image_shape: [3, 640, 640] diff --git a/configs/det/det_r50_vd_east.yml b/configs/det/det_r50_vd_east.yml index bb16f9fa..8d868199 100755 --- a/configs/det/det_r50_vd_east.yml +++ b/configs/det/det_r50_vd_east.yml @@ -6,7 +6,7 @@ Global: print_batch_step: 5 save_model_dir: ./output/det_east/ save_epoch_step: 200 - eval_batch_step: 5000 + eval_batch_step: [5000, 5000] train_batch_size_per_card: 8 test_batch_size_per_card: 16 image_shape: [3, 512, 512] From 5e38ec57a61d404b73c26a666810bec0da8f4ec4 Mon Sep 17 00:00:00 2001 From: LDOUBLEV Date: Tue, 7 Jul 2020 11:34:10 +0000 Subject: [PATCH 4/4] update det yml file --- configs/det/det_mv3_db.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/configs/det/det_mv3_db.yml b/configs/det/det_mv3_db.yml index f02c61c9..caa7bd4f 100755 --- a/configs/det/det_mv3_db.yml +++ b/configs/det/det_mv3_db.yml @@ -6,8 +6,8 @@ Global: print_batch_step: 2 save_model_dir: ./output/det_db/ save_epoch_step: 200 - # evaluation is run every 2000 iterations after the 5000th iteration - eval_batch_step: [5000, 5000] + # evaluation is run every 5000 iterations after the 4000th iteration + eval_batch_step: [4000, 5000] train_batch_size_per_card: 16 test_batch_size_per_card: 16 image_shape: [3, 640, 640]