Sachi Wagaarachchi committed on
Commit · 0655268
Parent(s): 7778aa1
debug: attention
src/chat_logic.py +11 -3
src/chat_logic.py
CHANGED
@@ -27,11 +27,19 @@ class ChatProcessor:
 skip_special_tokens=True
 )
 
-
+# Get full tokenizer output
+tokenized_inputs = pipe.tokenizer(prompt, return_tensors="pt")
 
-#
+# Determine model device
+device = pipe.model.device
+
+# Move all tensors to the correct device
+inputs_on_device = {k: v.to(device) for k, v in tokenized_inputs.items()}
+
+# Prepare generation kwargs with attention_mask
 generate_kwargs = {
-    "input_ids": input_ids,
+    "input_ids": inputs_on_device["input_ids"],
+    "attention_mask": inputs_on_device["attention_mask"],
     "max_new_tokens": max_new_tokens,
     "temperature": temperature,
     "top_p": top_p,
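For context, the change keeps the tokenizer's full output (rather than only input_ids) so that the attention_mask can be passed to generate along with the input IDs, with all tensors moved to the model's device first. Below is a minimal standalone sketch of the same pattern, assuming a transformers text-generation pipeline; the model name ("gpt2"), the prompt text, and the sampling values are illustrative placeholders, not values taken from this repository.

# Minimal sketch of the pattern used in this commit (assumptions noted above).
from transformers import pipeline

pipe = pipeline("text-generation", model="gpt2")  # placeholder model
prompt = "Hello, how are you?"                    # placeholder prompt

# Tokenize once and keep the full output so the attention_mask is available.
tokenized_inputs = pipe.tokenizer(prompt, return_tensors="pt")

# Move every tensor to the device the model lives on (CPU or GPU).
device = pipe.model.device
inputs_on_device = {k: v.to(device) for k, v in tokenized_inputs.items()}

# Pass attention_mask alongside input_ids when generating.
output_ids = pipe.model.generate(
    input_ids=inputs_on_device["input_ids"],
    attention_mask=inputs_on_device["attention_mask"],
    max_new_tokens=32,
    do_sample=True,
    temperature=0.7,
    top_p=0.9,
)
print(pipe.tokenizer.decode(output_ids[0], skip_special_tokens=True))

Supplying the attention_mask explicitly removes the ambiguity between padding and real tokens that transformers otherwise warns about when only input_ids are provided and the pad token falls back to the EOS token.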