Skip to content

Commit 3182c3e

Browse files
committed
Rectify code of the LayoutLM series models and adjust it to amp_level mode.
1 parent c698646 commit 3182c3e

18 files changed

+71
-121
lines changed

configs/kie/layoutlmv3/README.md

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -144,7 +144,7 @@ Apart from the dataset setting, please also check the following important args:
144144
system:
145145
mode:
146146
distribute: False # `True` for distributed training, `False` for standalone training
147-
amp_level: 'O0'
147+
amp_level: 'O3'
148148
seed: 42
149149
val_while_train: True # Validate while training
150150
drop_overflow_update: False
@@ -157,7 +157,6 @@ model:
157157
name: TokenClassificationHead
158158
num_classes: 7
159159
use_visual_backbone: True
160-
use_float16: True
161160
pretrained:
162161
...
163162
train:

configs/kie/layoutlmv3/ser_layoutlmv3_xfund_zh.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
system:
22
mode: 0 # 0 for graph mode, 1 for pynative mode in MindSpore
33
distribute: False
4-
amp_level: "O0"
4+
amp_level: "O3"
55
seed: 42
66
log_interval: 10
77
val_start_epoch: 50
@@ -17,7 +17,6 @@ model:
1717
name: TokenClassificationHead
1818
num_classes: 7
1919
use_visual_backbone: True
20-
use_float16: True
2120
pretrained:
2221

2322
postprocess:

configs/kie/layoutxlm/re_layoutxlm_xfund_zh.yaml

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
system:
22
mode: 0 # 0 for graph mode, 1 for pynative mode in MindSpore
33
distribute: False
4-
amp_level: 'O0'
4+
amp_level: 'O3'
55
seed: 42
66
log_interval: 10
77
val_while_train: True
@@ -16,11 +16,9 @@ model:
1616
pretrained: True
1717
num_classes: &num_classes 7
1818
use_visual_backbone: True
19-
use_float16: True
2019
head:
2120
name: RelationExtractionHead
2221
use_visual_backbone: True
23-
use_float16: True
2422
pretrained:
2523

2624
postprocess:

configs/kie/layoutxlm/ser_layoutxlm_xfund_zh.yaml

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
system:
22
mode: 0 # 0 for graph mode, 1 for pynative mode in MindSpore
33
distribute: False
4-
amp_level: 'O0'
4+
amp_level: 'O3'
55
seed: 42
66
log_interval: 10
77
val_while_train: True
@@ -15,12 +15,10 @@ model:
1515
pretrained: True
1616
num_classes: &num_classes 7
1717
use_visual_backbone: True
18-
use_float16: True
1918
head :
2019
name: TokenClassificationHead
2120
num_classes: 7
2221
use_visual_backbone: True
23-
use_float16: True
2422
pretrained:
2523

2624
postprocess:

configs/kie/vi_layoutxlm/README.md

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -159,7 +159,7 @@ Apart from the dataset setting, please also check the following important args:
159159
system:
160160
mode:
161161
distribute: False # `True` for distributed training, `False` for standalone training
162-
amp_level: 'O0'
162+
amp_level: 'O3'
163163
seed: 42
164164
val_while_train: True # Validate while training
165165
drop_overflow_update: False
@@ -171,12 +171,10 @@ model:
171171
pretrained: True
172172
num_classes: &num_classes 7
173173
use_visual_backbone: False
174-
use_float16: True
175174
head :
176175
name: TokenClassificationHead
177176
num_classes: 7
178177
use_visual_backbone: False
179-
use_float16: True
180178
pretrained:
181179
...
182180
train:

configs/kie/vi_layoutxlm/README_CN.md

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -156,7 +156,7 @@ eval:
156156
system:
157157
mode:
158158
distribute: False # 分布式训练为True,单卡训练为False
159-
amp_level: 'O0'
159+
amp_level: 'O3'
160160
seed: 42
161161
val_while_train: True # 边训练边验证
162162
drop_overflow_update: False
@@ -168,12 +168,10 @@ model:
168168
pretrained: True
169169
num_classes: &num_classes 7
170170
use_visual_backbone: False
171-
use_float16: True
172171
head :
173172
name: TokenClassificationHead
174173
num_classes: 7
175174
use_visual_backbone: False
176-
use_float16: True
177175
pretrained:
178176
...
179177
train:

configs/kie/vi_layoutxlm/re_vi_layoutxlm_xfund_zh.yaml

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
system:
22
mode: 0 # 0 for graph mode, 1 for pynative mode in MindSpore
33
distribute: False
4-
amp_level: "O0"
4+
amp_level: "O3"
55
seed: 42
66
log_interval: 10
77
val_while_train: True
@@ -16,11 +16,9 @@ model:
1616
pretrained: True
1717
num_classes: &num_classes 7
1818
use_visual_backbone: False
19-
use_float16: True
2019
head:
2120
name: RelationExtractionHead
2221
use_visual_backbone: False
23-
use_float16: True
2422
pretrained:
2523

2624
postprocess:
@@ -90,11 +88,11 @@ train:
9088
"bbox",
9189
"attention_mask",
9290
"token_type_ids",
93-
"image",
9491
"question",
9592
"question_label",
9693
"answer",
9794
"answer_label",
95+
"image",
9896
"relation_label",
9997
]
10098
net_input_column_index: [0, 1, 2, 3, 4, 5, 6, 7, 8] # input indices for network forward func in output_columns

configs/kie/vi_layoutxlm/ser_vi_layoutxlm_xfund_zh.yaml

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
system:
22
mode: 0 # 0 for graph mode, 1 for pynative mode in MindSpore
33
distribute: False
4-
amp_level: 'O0'
4+
amp_level: 'O3'
55
seed: 42
66
log_interval: 10
77
val_while_train: True
@@ -15,12 +15,10 @@ model:
1515
pretrained: True
1616
num_classes: &num_classes 7
1717
use_visual_backbone: False
18-
use_float16: True
1918
head :
2019
name: TokenClassificationHead
2120
num_classes: 7
2221
use_visual_backbone: False
23-
use_float16: True
2422
pretrained:
2523

2624
postprocess:

mindocr/losses/kie_loss.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,6 +28,6 @@ def __init__(self, **kwargs):
2828
super().__init__()
2929
self.loss_fct = nn.CrossEntropyLoss()
3030

31-
def construct(self, predicts, attention_mask, labels):
31+
def construct(self, predicts, labels):
3232
loss = self.loss_fct(predicts.transpose(0, 2, 1), labels.astype(ms.int32))
3333
return loss

mindocr/models/backbones/layoutlmv3/configuration.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3,9 +3,8 @@
33

44
@dataclass
55
class LayoutLMv3PretrainedConfig:
6-
def __init__(self, use_float16=False):
6+
def __init__(self):
77
pretrained_config = {
8-
"use_float16": use_float16,
98
"fast_qkv": False,
109
"vocab_size": 250002,
1110
"hidden_size": 768,

0 commit comments

Comments
 (0)