HemanM committed on
Commit
74435ef
·
verified ·
1 Parent(s): 2f5aba0

Update generate.py

Browse files
Files changed (1) hide show
  1. generate.py +4 -3
generate.py CHANGED
@@ -24,13 +24,14 @@ def generate_response(prompt, max_length=100, top_k=40):
24
 
25
  # Top-k sampling
26
  top_k_probs, top_k_indices = torch.topk(next_token_logits, top_k)
27
- probs = torch.softmax(top_k_probs.squeeze(0), dim=-1) # Flatten
28
  sampled_index = torch.multinomial(probs, 1).item()
29
  next_token = top_k_indices[0, sampled_index]
30
 
31
- input_ids = torch.cat([input_ids, next_token.unsqueeze(0)], dim=1)
 
 
32
 
33
- # Stop if EOS token
34
  if next_token.item() == tokenizer.eos_token_id:
35
  break
36
 
 
24
 
25
  # Top-k sampling
26
  top_k_probs, top_k_indices = torch.topk(next_token_logits, top_k)
27
+ probs = torch.softmax(top_k_probs.squeeze(0), dim=-1)
28
  sampled_index = torch.multinomial(probs, 1).item()
29
  next_token = top_k_indices[0, sampled_index]
30
 
31
+ # Reshape next_token to match input_ids shape
32
+ next_token = next_token.unsqueeze(0).unsqueeze(0) # Shape: (1, 1)
33
+ input_ids = torch.cat([input_ids, next_token], dim=1)
34
 
 
35
  if next_token.item() == tokenizer.eos_token_id:
36
  break
37