Spaces:

vpkprasanna
/

TokenizerViz

Sleeping

App Files Files Community

prasanna kumar committed on Aug 30, 2024

Commit

b9a925b

1 Parent(s): 3c6d585

Add default values for models and show some examples that are easy to try

Browse files

Files changed (1) hide show

app.py +21 -1

app.py CHANGED Viewed

@@ -67,16 +67,26 @@ def process_input(input_type, input_value, model_name):
     return analysis, " ".join(tokens), str(token_ids), words_hist, special_chars_hist, numbers_hist
 with gr.Blocks() as iface:
     gr.Markdown("# LLM Tokenization - Convert Text to tokens and vice versa!")
     gr.Markdown("Enter text or token IDs and select a model to see the results, including word count, token analysis, and histograms of most common elements.")
     with gr.Row():
         input_type = gr.Radio(["Text", "Token IDs"], label="Input Type", value="Text")
-        model_name = gr.Dropdown(choices=MODELS, label="Select Model")
     input_text = gr.Textbox(lines=5, label="Input")
     submit_button = gr.Button("Process")
     analysis_output = gr.Textbox(label="Analysis", lines=6)
@@ -88,6 +98,16 @@ with gr.Blocks() as iface:
         special_chars_plot = gr.Plot(label="Most Common Special Characters")
         numbers_plot = gr.Plot(label="Most Common Numbers")
     submit_button.click(
         process_input,
         inputs=[input_type, input_text, model_name],

     return analysis, " ".join(tokens), str(token_ids), words_hist, special_chars_hist, numbers_hist
+def text_example():
+    return "Hello, world! This is an example text input for tokenization."
+def token_ids_example():
+    return "[128000, 9906, 11, 1917, 0, 1115, 374, 459, 3187, 1495, 1988, 369, 4037, 2065, 13]"
 with gr.Blocks() as iface:
     gr.Markdown("# LLM Tokenization - Convert Text to tokens and vice versa!")
     gr.Markdown("Enter text or token IDs and select a model to see the results, including word count, token analysis, and histograms of most common elements.")
     with gr.Row():
         input_type = gr.Radio(["Text", "Token IDs"], label="Input Type", value="Text")
+        model_name = gr.Dropdown(choices=MODELS, label="Select Model",value=MODELS[0])
     input_text = gr.Textbox(lines=5, label="Input")
+    with gr.Row():
+        text_example_button = gr.Button("Load Text Example")
+        token_ids_example_button = gr.Button("Load Token IDs Example")
     submit_button = gr.Button("Process")
     analysis_output = gr.Textbox(label="Analysis", lines=6)
         special_chars_plot = gr.Plot(label="Most Common Special Characters")
         numbers_plot = gr.Plot(label="Most Common Numbers")
+    text_example_button.click(
+        lambda: (text_example(), "Text"),
+        outputs=[input_text, input_type]
+    )
+    token_ids_example_button.click(
+        lambda: (token_ids_example(), "Token IDs"),
+        outputs=[input_text, input_type]
+    )
     submit_button.click(
         process_input,
         inputs=[input_type, input_text, model_name],