update model (fix loss bug)
This commit is contained in:
parent
4ef9c41563
commit
a87f628400
@@ -369,7 +369,8 @@ class Transformer(PreTrainedModel):
|
|||||||
|
|
||||||
if targets is not None:
|
if targets is not None:
|
||||||
logits = self.output(h)
|
logits = self.output(h)
|
||||||
self.last_loss = F.cross_entropy(logits.view(-1, logits.size(-1)), targets.view(-1), ignore_index=-1)
|
self.last_loss = F.cross_entropy(logits.view(-1, logits.size(-1)), targets.view(-1),
|
||||||
|
ignore_index=0, reduction='none')
|
||||||
else:
|
else:
|
||||||
logits = self.output(h[:, [-1], :])
|
logits = self.output(h[:, [-1], :])
|
||||||
self.last_loss = None
|
self.last_loss = None
|
||||||
|
Loading…
x
Reference in New Issue
Block a user