Crystalcareai
committed on
Update modeling_quiet.py
Browse files
- modeling_quiet.py +2 -2
modeling_quiet.py
CHANGED
@@ -1737,10 +1737,10 @@ class QuietForCausalLM(QuietPreTrainedModel, GenerationMixin):
|
|
1737 |
shift_labels = labels[..., 1 + shift_amount:].contiguous()
|
1738 |
# Flatten the tokens
|
1739 |
loss_fct = CrossEntropyLoss(reduction="none")
|
1740 |
-
print("Shift logits before:", shift_logits)
|
1741 |
shift_logits = shift_logits.view(-1, self.config.vocab_size)
|
1742 |
shift_labels = shift_labels.view(-1).clone()
|
1743 |
-
print("shift logits after:", shift_logits)
|
1744 |
# Enable model parallelism
|
1745 |
shift_labels[shift_labels == self.tokenizer.pad_token_id] = -100
|
1746 |
shift_labels = shift_labels.to(shift_logits.device)
|
|
|
1737 |
shift_labels = labels[..., 1 + shift_amount:].contiguous()
|
1738 |
# Flatten the tokens
|
1739 |
loss_fct = CrossEntropyLoss(reduction="none")
|
1740 |
+
# print("Shift logits before:", shift_logits)
|
1741 |
shift_logits = shift_logits.view(-1, self.config.vocab_size)
|
1742 |
shift_labels = shift_labels.view(-1).clone()
|
1743 |
+
# print("shift logits after:", shift_logits)
|
1744 |
# Enable model parallelism
|
1745 |
shift_labels[shift_labels == self.tokenizer.pad_token_id] = -100
|
1746 |
shift_labels = shift_labels.to(shift_logits.device)
|