Spaces:

jdelavande
/

chat-ui-energy

Running on CPU Upgrade

nsarrazin committed on Mar 6

Commit

7139d72

unverified ·

1 Parent(s): 10fd4a2

feat(hchat): add QwQ-32B to prod HuggingChat config (#1746)

Files changed (1) hide show

chart/env/prod.yaml CHANGED Viewed

@@ -197,23 +197,16 @@ envVars:
         ]
       },
       {
-        "name": "Qwen/QwQ-32B-Preview",
         "preprompt": "You are a helpful and harmless assistant. You are Qwen developed by Alibaba. You should think step-by-step.",
-        "modelUrl": "https://huggingface.co/Qwen/QwQ-32B-Preview",
-        "websiteUrl": "https://qwenlm.github.io/blog/qwq-32b-preview/",
         "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
-        "description": "QwQ is an experiment model from the Qwen Team with advanced reasoning capabilities.",
         "reasoning": {
-          "type": "summarize"
-        },
-        "parameters": {
-          "stop": ["<|im_end|>"],
-          "truncate": 12288,
-          "max_new_tokens": 4096,
-          "temperature": 0.7,
-          "top_k": 20,
-          "top_p": 0.8,
-          "repetition_penalty": 1.05
         },
         "promptExamples": [
           {
@@ -228,6 +221,12 @@ envVars:
             "title": "Measuring 6 liters",
             "prompt": "I have a 6- and a 12-liter jug. I want to measure exactly 6 liters."
           }
         ]
       },
       {
@@ -433,6 +432,10 @@ envVars:
       {
         "name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
         "transferTo": "meta-llama/Llama-3.3-70B-Instruct"
       }
     ]
   PUBLIC_ORIGIN: "https://huggingface.co"

         ]
       },
       {
+        "name": "Qwen/QwQ-32B",
         "preprompt": "You are a helpful and harmless assistant. You are Qwen developed by Alibaba. You should think step-by-step.",
+        "modelUrl": "https://huggingface.co/Qwen/QwQ-32B",
+        "websiteUrl": "https://qwenlm.github.io/blog/qwq-32b/",
         "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
+        "description": "QwQ is the latest reasoning model released by the Qwen team, approaching the capabilities of R1 in benchmarks.",
         "reasoning": {
+          "type": "tokens",
+          "beginToken": "",
+          "endToken": "</think>"
         },
         "promptExamples": [
           {
             "title": "Measuring 6 liters",
             "prompt": "I have a 6- and a 12-liter jug. I want to measure exactly 6 liters."
           }
+        ],
+        "endpoints": [
+          {
+            "type": "openai",
+            "baseURL": "https://internal.api-inference.huggingface.co/models/Qwen/QwQ-32B/v1"
+          }
         ]
       },
       {
       {
         "name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
         "transferTo": "meta-llama/Llama-3.3-70B-Instruct"
+      },
+      {
+        "name": "Qwen/QwQ-32B-Preview",
+        "transferTo": "Qwen/QwQ-32B"
       }
     ]
   PUBLIC_ORIGIN: "https://huggingface.co"