Spaces: Running on Zero
AbstractPhil committed · Commit e7eb866 · 1 Parent(s): 206ca02
oauth
app.py CHANGED
@@ -341,47 +341,47 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     )
 
     # Sign-in note
-    login_status = gr.Markdown(
-        …
-    )
+    login_status = gr.Markdown(
+        "If you're logged into huggingface.co in this browser, ZeroGPU will use *your* quota automatically."
+    )
 
-    with gr.Row():
-        system_prompt = gr.Textbox(label="System", value=SYSTEM_DEF)
-    with gr.Accordion("Generation settings", open=False):
-        with gr.Row():
-            temperature = gr.Slider(0.0, 2.0, value=0.7, step=0.05, label="temperature")
-            top_p = gr.Slider(0.1, 1.0, value=0.9, step=0.01, label="top_p")
-            top_k = gr.Slider(0, 200, value=0, step=1, label="top_k (0=off)")
-            max_new = gr.Slider(16, 2048, value=MAX_DEF, step=8, label="max_new_tokens")
-            do_sample = gr.Checkbox(value=True, label="do_sample")
-            seed = gr.Number(value=None, label="seed (optional)")
-    with gr.Accordion("Rose guidance (optional)", open=False):
-        with gr.Row():
-            …
-    )
+    with gr.Row():
+        system_prompt = gr.Textbox(label="System", value=SYSTEM_DEF)
+    with gr.Accordion("Generation settings", open=False):
+        with gr.Row():
+            temperature = gr.Slider(0.0, 2.0, value=0.7, step=0.05, label="temperature")
+            top_p = gr.Slider(0.1, 1.0, value=0.9, step=0.01, label="top_p")
+            top_k = gr.Slider(0, 200, value=0, step=1, label="top_k (0=off)")
+            max_new = gr.Slider(16, 2048, value=MAX_DEF, step=8, label="max_new_tokens")
+            do_sample = gr.Checkbox(value=True, label="do_sample")
+            seed = gr.Number(value=None, label="seed (optional)")
+    with gr.Accordion("Rose guidance (optional)", open=False):
+        with gr.Row():
+            rose_enable = gr.Checkbox(value=False, label="Enable Rose bias at decode")
+            rose_alpha = gr.Slider(0.0, 5.0, value=1.0, step=0.05, label="rose alpha (strength)")
+            rose_score = gr.Slider(0.0, 1.0, value=1.0, step=0.01, label="rose score (0–1)")
+            rose_tokens = gr.Textbox(label="token:weight list (comma-separated)", value="")
+            rose_json = gr.Textbox(label="JSON {token: weight}", value="")
+
+    chat = gr.ChatInterface(
+        fn=generate_stream,
+        type="messages",
+        additional_inputs=[system_prompt, temperature, top_p, top_k, max_new, do_sample, seed, rose_enable, rose_alpha, rose_score, rose_tokens, rose_json],
+        title="Mirel",
+        cache_examples=False,
+    )
 
-    gr.Markdown(
-        """
-        …
-        - Set env `ZEROGPU=1` for just-in-time GPU allocation via @spaces.GPU.
-        - Set `ADAPTER_ID=AbstractPhil/mirel-gpt-oss-20b` and `ADAPTER_SUBFOLDER=checkpoints/checkpoint-516` to use the provided adapter.
-        - Use `torch==2.4.0` for ZeroGPU.
-        - Rose guidance biases logits; it does not change weights.
-        """
-    )
+    gr.Markdown(
+        """
+        **Notes**
+        - Set env `ZEROGPU=1` for just-in-time GPU allocation via @spaces.GPU.
+        - Set `ADAPTER_ID=AbstractPhil/mirel-gpt-oss-20b` and `ADAPTER_SUBFOLDER=checkpoints/checkpoint-516` to use the provided adapter.
+        - Use `torch==2.4.0` for ZeroGPU.
+        - Rose guidance biases logits; it does not change weights.
+        """
+    )
 
 if __name__ == "__main__":
     demo.queue(max_size=8 if ZEROGPU else 32).launch(server_name="0.0.0.0", server_port=7860)
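For context on how the new `additional_inputs` wiring is consumed: with `type="messages"`, Gradio calls the handler with the user message, the message-dict history, and then each additional input in the order listed. A minimal sketch of a compatible `generate_stream` follows; only the parameter order is implied by the diff, and the body here is a placeholder, not the app's actual implementation.

```python
from typing import Iterator

def generate_stream(
    message: str,
    history: list[dict],   # type="messages" -> [{"role": ..., "content": ...}, ...]
    system_prompt: str,
    temperature: float,
    top_p: float,
    top_k: int,
    max_new: int,
    do_sample: bool,
    seed: float | None,
    rose_enable: bool,
    rose_alpha: float,
    rose_score: float,
    rose_tokens: str,
    rose_json: str,
) -> Iterator[str]:
    # With a generator handler, yielding progressively longer strings
    # streams partial output into the chat window.
    text = ""
    for chunk in ("(placeholder ", "streamed ", "reply)"):
        text += chunk
        yield text
```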
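The two Rose textboxes accept overlapping formats: a comma-separated `token:weight` list and a JSON object. A sketch of merging them into one weight map; the function name and the precedence rule (JSON overrides the pair list) are assumptions, not taken from this commit.

```python
import json

def parse_rose_weights(rose_tokens: str, rose_json: str) -> dict[str, float]:
    """Merge both Rose inputs into a single {token: weight} map (illustrative)."""
    weights: dict[str, float] = {}
    # Pair form, e.g. "rose:2.0, thorn:-1.0". rpartition tolerates colons in tokens.
    for pair in filter(None, (p.strip() for p in rose_tokens.split(","))):
        token, _, weight = pair.rpartition(":")
        if token:
            weights[token] = float(weight)
    # JSON form, e.g. '{"rose": 2.0}'. Assumed to take precedence on conflicts.
    if rose_json.strip():
        weights.update({str(k): float(v) for k, v in json.loads(rose_json).items()})
    return weights
```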
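On the last bullet in the diff ("Rose guidance biases logits; it does not change weights"): in `transformers`, decode-time steering of this kind is typically implemented as a `LogitsProcessor` that adds a bias to selected token ids at each step. The sketch below shows that general mechanism only; the actual Rose implementation is not part of this hunk.

```python
import torch
from transformers import LogitsProcessor

class RoseBiasProcessor(LogitsProcessor):
    """Adds a fixed additive bias to chosen token logits at every decode step.

    Illustrative only: token_bias maps vocabulary ids to biases, scaled by
    alpha * score (mirroring the rose_alpha / rose_score sliders above).
    """

    def __init__(self, token_bias: dict[int, float], alpha: float, score: float):
        self.token_bias = token_bias
        self.scale = alpha * score

    def __call__(self, input_ids: torch.LongTensor, scores: torch.FloatTensor) -> torch.FloatTensor:
        # Shift logits without ever touching model weights.
        for token_id, weight in self.token_bias.items():
            scores[:, token_id] += self.scale * weight
        return scores
```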
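The `ZEROGPU=1` note refers to Hugging Face's ZeroGPU Spaces, where the `spaces` package attaches a GPU only while a decorated function runs. A sketch of the pattern; the conditional wrapping is an assumption (the app may simply decorate unconditionally).

```python
import os
import spaces  # provided on Hugging Face Spaces

ZEROGPU = os.getenv("ZEROGPU") == "1"

def _generate(*args, **kwargs):
    ...  # model forward / generation goes here

# On ZeroGPU hardware, wrap the hot path so a GPU is allocated just in time
# for the call and released afterwards.
if ZEROGPU:
    _generate = spaces.GPU(_generate)
```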
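The `ADAPTER_ID` / `ADAPTER_SUBFOLDER` bullet maps naturally onto `peft`'s loader. A sketch, assuming the app attaches a PEFT adapter on top of the base model; the helper name is hypothetical.

```python
import os
from peft import PeftModel

ADAPTER_ID = os.getenv("ADAPTER_ID", "AbstractPhil/mirel-gpt-oss-20b")
ADAPTER_SUBFOLDER = os.getenv("ADAPTER_SUBFOLDER", "checkpoints/checkpoint-516")

def attach_adapter(base_model):
    # Loads adapter weights from the hub repo + subfolder named in the notes.
    return PeftModel.from_pretrained(base_model, ADAPTER_ID, subfolder=ADAPTER_SUBFOLDER)
```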