Skip to content

Commit 873bd7d

Browse files
committed
fix ernie output
1 parent d25802e commit 873bd7d

File tree

4 files changed

+6
-2
lines changed

4 files changed

+6
-2
lines changed

examples/config/ernie4_5/sft_argument_ernie4_5_0p3b.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -42,5 +42,6 @@
42 42   "sequence_parallel": false,
43 43   "report_to": "none",
44 44   "convert_from_hf": true,
   45 + "save_to_hf": true,
45 46   "pp_seg_method": "layer:DecoderLayer|EmptyLayer"
46 47   }

examples/config/ernie4_5_moe/sft_argument_ernie4_5_21b_a3b.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -41,5 +41,6 @@
41 41   "sequence_parallel": true,
42 42   "report_to": "none",
43 43   "convert_from_hf": true,
   44 + "save_to_hf": true,
44 45   "pp_seg_method": "layer:DecoderLayer|EmptyLayer"
45 46   }

paddleformers/transformers/ernie4_5/modeling.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -834,7 +834,8 @@ def forward(
834 834
835 835   # Pretrain & Eval must have labels
836 836   assert labels is not None
837     - return self.criterion(logits, labels, loss_mask)
    837 + loss, _ = self.criterion(logits, labels, loss_mask)
    838 + return loss, logits
838 839
839 840
840 841   class Ernie4_5ForCausalLMPipe(GeneralModelForCausalLMPipe):

paddleformers/transformers/ernie4_5_moe/modeling.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1157,7 +1157,8 @@ def forward(
1157 1157   # Pretrain & Eval must have labels
1158 1158   assert labels is not None
1159 1159
1160      - return self.criterion(logits, labels, loss_mask, router_loss=router_loss, mtp_logits=mtp_logits)
     1160 + loss, _ = self.criterion(logits, labels, loss_mask, router_loss=router_loss, mtp_logits=mtp_logits)
     1161 + return loss, logits
1161 1162
1162 1163
1163 1164   class Ernie4_5_MoeForCausalLMPipe(GeneralModelForCausalLMPipe):

0 commit comments

Comments
 (0)