@@ -57,31 +57,20 @@ train:
57
57
label_file : XFUND/zh_train/train.json
58
58
sample_ratio : 1.0
59
59
transform_pipeline :
60
- - DecodeImage :
61
- img_mode : RGB
62
- to_float32 : False
63
60
- VQATokenLabelEncode :
64
61
contains_re : False
65
- algorithm : &algorithm LayoutXLM
62
+ algorithm : &algorithm VI-LayoutXLM
66
63
class_path : *class_path
67
64
order_method : tb-yx
68
65
- VQATokenPad :
69
66
max_seq_len : &max_seq_len 512
70
67
return_attention_mask : True
71
68
- VQASerTokenChunk :
72
69
max_seq_len : *max_seq_len
73
- - LayoutResize :
74
- size : [ 224, 224 ]
75
- - NormalizeImage :
76
- bgr_to_rgb : False
77
- is_hwc : True
78
- mean : imagenet
79
- std : imagenet
80
- - ToCHWImage :
81
70
# Order of the columns output by the dataloader; it must match the network inputs, the labels for the loss function, and any optional data for debugging/visualization
82
- output_columns : [ 'input_ids', 'bbox','attention_mask','token_type_ids', 'image', 'labels' ]
83
- net_input_column_index : [ 0, 1, 2, 3, 4 ] # input indices for network forward func in output_columns
84
- label_column_index : [ 2, 5 ] # input indices marked as label
71
+ output_columns : [ 'input_ids', 'bbox', 'attention_mask', 'token_type_ids', 'labels' ]
72
+ net_input_column_index : [ 0, 1, 2, 3 ] # input indices for network forward func in output_columns
73
+ label_column_index : [ 4 ] # input indices marked as label
85
74
86
75
loader :
87
76
shuffle : True
100
89
sample_ratio : 1.0
101
90
shuffle : False
102
91
transform_pipeline :
103
- - DecodeImage :
104
- img_mode : RGB
105
- to_float32 : False
106
92
- VQATokenLabelEncode :
107
93
contains_re : False
108
94
algorithm : *algorithm
@@ -113,18 +99,10 @@ eval:
113
99
return_attention_mask : True
114
100
- VQASerTokenChunk :
115
101
max_seq_len : *max_seq_len
116
- - LayoutResize :
117
- size : [ 224, 224 ]
118
- - NormalizeImage :
119
- bgr_to_rgb : False
120
- is_hwc : True
121
- mean : imagenet
122
- std : imagenet
123
- - ToCHWImage :
124
102
# Order of the columns output by the dataloader; it must match the network inputs and the labels used for evaluation
125
- output_columns : [ 'input_ids', 'bbox', 'attention_mask','token_type_ids','image', 'labels' ]
126
- net_input_column_index : [ 0, 1, 2, 3, 4 ] # input indices for network forward func in output_columns
127
- label_column_index : [ 2, 5 ] # input indices marked as label
103
+ output_columns : [ 'input_ids', 'bbox', 'attention_mask', 'token_type_ids', 'labels' ]
104
+ net_input_column_index : [ 0, 1, 2, 3 ] # input indices for network forward func in output_columns
105
+ label_column_index : [ 4 ] # input indices marked as label
128
106
129
107
loader :
130
108
shuffle : False
0 commit comments