add comment

2024-03-09 11:03:30 +08:00
parent bc182d09e0
commit 104f521f79
2 changed files with 5 additions and 1 deletions
--- a/llama/rellama.py
+++ b/llama/rellama.py
@@ -133,8 +133,10 @@ class Method_1(ReLlamaForCausalLM):
            for i in range(predict_logits.size(0)):
                # iterate over the batch
                
+                # token id 1 is the BOS token, which marks the start of the response
                start_idx = torch.where(labels[i] == 1)[0].item()

+                # if a label inside the response is -100, we should calculate the kl_div loss for that position
                maintain_position: List[int] = []
                for idx in range(start_idx, labels[i].size(0)):
                    if labels[i][idx] == -100: