@@ -57,31 +57,20 @@ train:
5757 label_file : XFUND/zh_train/train.json
5858 sample_ratio : 1.0
5959 transform_pipeline :
60- - DecodeImage :
61- img_mode : RGB
62- to_float32 : False
6360 - VQATokenLabelEncode :
6461 contains_re : False
65- algorithm : &algorithm LayoutXLM
62+ algorithm : &algorithm VI-LayoutXLM
6663 class_path : *class_path
6764 order_method : tb-yx
6865 - VQATokenPad :
6966 max_seq_len : &max_seq_len 512
7067 return_attention_mask : True
7168 - VQASerTokenChunk :
7269 max_seq_len : *max_seq_len
73- - LayoutResize :
74- size : [ 224, 224 ]
75- - NormalizeImage :
76- bgr_to_rgb : False
77- is_hwc : True
78- mean : imagenet
79- std : imagenet
80- - ToCHWImage :
8170 # the order of the dataloader list, matching the network input and the input labels for the loss function, and optional data for debug/visualize
82- output_columns : [ 'input_ids', 'bbox','attention_mask','token_type_ids', 'image ', 'labels' ]
83- net_input_column_index : [ 0, 1, 2, 3, 4 ] # input indices for network forward func in output_columns
84- label_column_index : [ 2, 5 ] # input indices marked as label
71+ output_columns : [ 'input_ids', 'bbox', 'attention_mask', 'token_type_ids', 'labels' ]
72+ net_input_column_index : [ 0, 1, 2, 3 ] # input indices for network forward func in output_columns
73+ label_column_index : [ 4 ] # input indices marked as label
8574
8675 loader :
8776 shuffle : True
10089 sample_ratio : 1.0
10190 shuffle : False
10291 transform_pipeline :
103- - DecodeImage :
104- img_mode : RGB
105- to_float32 : False
10692 - VQATokenLabelEncode :
10793 contains_re : False
10894 algorithm : *algorithm
@@ -113,18 +99,10 @@ eval:
11399 return_attention_mask : True
114100 - VQASerTokenChunk :
115101 max_seq_len : *max_seq_len
116- - LayoutResize :
117- size : [ 224, 224 ]
118- - NormalizeImage :
119- bgr_to_rgb : False
120- is_hwc : True
121- mean : imagenet
122- std : imagenet
123- - ToCHWImage :
124102 # the order of the dataloader list, matching the network input and the labels for evaluation
125- output_columns : [ 'input_ids', 'bbox', 'attention_mask','token_type_ids','image ', 'labels' ]
126- net_input_column_index : [ 0, 1, 2, 3, 4 ] # input indices for network forward func in output_columns
127- label_column_index : [ 2, 5 ] # input indices marked as label
103+ output_columns : [ 'input_ids', 'bbox', 'attention_mask', 'token_type_ids', 'labels' ]
104+ net_input_column_index : [ 0, 1, 2, 3 ] # input indices for network forward func in output_columns
105+ label_column_index : [ 4 ] # input indices marked as label
128106
129107 loader :
130108 shuffle : False
0 commit comments