diff --git a/hft.py b/hft.py
index 7ca3dcb..4346b56 100644
--- a/hft.py
+++ b/hft.py
@@ -127,8 +127,8 @@ class CustomModel(nn.Module):
 
     def forward(self, input_ids=None, attention_mask=None, labels=None, source_idx=None, **kwargs):
         if source_idx is not None:
-            print("Max source_idx:", torch.max(source_idx))
-            print("Num embeddings:", self.source_embedding.num_embeddings)
+            #print("Max source_idx:", torch.max(source_idx))
+            #print("Num embeddings:", self.source_embedding.num_embeddings)
             source_idx = torch.clamp(source_idx, 0, self.source_embedding.num_embeddings - 1)
             source_embeds = self.source_embedding(source_idx).unsqueeze(1).expand(-1, input_ids.size(1), -1)
             hidden_states = self.base_model.get_input_embeddings()(input_ids) + source_embeds