# PaddleOCR/configs/rec/rec_icdar15_train.yml
# Web-view metadata: 101 lines, 2.2 KiB, YAML (blame entry 2020-12-11 17:50:01 +08:00).
# Run-wide settings: device, schedule, logging cadence, output paths, and
# the options used for data/label processing.
Global:
  use_gpu: true
  epoch_num: 72
  log_smooth_window: 20
  print_batch_step: 10
  save_model_dir: ./output/rec/ic15/
  save_epoch_step: 3
  # evaluation is run every 2000 iterations
  eval_batch_step: [0, 2000]
  cal_metric_during_train: true
  # Both are intentionally left unset; written as explicit null rather than
  # a bare empty value so the intent is unambiguous.
  pretrained_model: null
  checkpoints: null
  save_inference_dir: ./
  use_visualdl: false
  infer_img: doc/imgs_words_en/word_10.png
  # for data or label process
  character_dict_path: ppocr/utils/ic15_dict.txt
  character_type: ch
  max_text_length: 25
  infer_mode: false
  use_space_char: false
  save_res_path: ./output/rec/predicts_ic15.txt

# Optimizer settings: Adam with a learning rate of 0.0005 and an L2
# regularizer whose factor is 0.
Optimizer:
  name: Adam
  beta1: 0.9
  beta2: 0.999
  lr:
    learning_rate: 0.0005
  regularizer:
    name: 'L2'
    factor: 0
# Model definition: a CRNN recognizer described as Transform / Backbone /
# Neck / Head sub-sections, each selected by its `name`.
Architecture:
  model_type: rec
  algorithm: CRNN
  # No transform stage is configured (explicit null).
  Transform: null
  Backbone:
    name: MobileNetV3
    scale: 0.5
    model_name: large
  Neck:
    name: SequenceEncoder
    encoder_type: rnn
    hidden_size: 96
  Head:
    name: CTCHead
    fc_decay: 0
# Training loss, selected by name.
Loss:
  name: CTCLoss
# Post-processing step applied to model output, selected by name.
PostProcess:
  name: CTCLabelDecode
# Evaluation metric; `main_indicator` names the value reported as the
# headline score (presumably also used for best-model selection — confirm).
Metric:
  name: RecMetric
  main_indicator: acc
# Training data pipeline: dataset location, the ordered list of per-sample
# transforms, and data-loader options.
Train:
  dataset:
    name: SimpleDataSet
    data_dir: ./train_data/ic15_data/
    label_file_list: ["./train_data/ic15_data/rec_gt_train.txt"]
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      # Class handling label; takes no arguments here (explicit null).
      - CTCLabelEncode: null
      - RecResizeImg:
          image_shape: [3, 32, 100]
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
  loader:
    shuffle: true
    batch_size_per_card: 256
    drop_last: true
    num_workers: 8
    use_shared_memory: false

# Evaluation data pipeline: same transform chain as training, read from the
# test label file, without shuffling or dropping the last partial batch.
Eval:
  dataset:
    name: SimpleDataSet
    data_dir: ./train_data/ic15_data
    label_file_list: ["./train_data/ic15_data/rec_gt_test.txt"]
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      # Class handling label; takes no arguments here (explicit null).
      - CTCLabelEncode: null
      - RecResizeImg:
          image_shape: [3, 32, 100]
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
  loader:
    shuffle: false
    drop_last: false
    batch_size_per_card: 256
    num_workers: 4
    use_shared_memory: false