Spaces:

nazdridoy
/

inferoxy-hub

Running

App Files Files Community

nazdridoy committed on Aug 22

Commit

a6a8ac0

verified ·

1 Parent(s): 9aff9bb

feat(chat): always display model reasoning

Browse files

- [remove] Remove `show_reasoning` parameter from `handle_chat_submit` and `handle_chat_retry` (chat_handler.py:168,275)
- [feat] Hardcode the reasoning flag passed to `render_with_reasoning_toggle` to `True` in `handle_chat_submit` and `handle_chat_retry` (chat_handler.py:203,275)
- [remove] Remove `show_reasoning` checkbox and its usage in chat event handlers (ui_components.py:52-57,87-88,102-103,124-125)

Files changed (2) hide show

chat_handler.py +4 -4
ui_components.py +3 -8

chat_handler.py CHANGED Viewed

@@ -168,7 +168,7 @@ def chat_respond(
         yield format_error_message("Unexpected Error", f"An unexpected error occurred: {error_msg}")
-def handle_chat_submit(message, history, system_msg, model_name, max_tokens, temperature, top_p, show_reasoning=False, hf_token: gr.OAuthToken = None):
     """
     Handle chat submission and manage conversation history with streaming.
     """
@@ -203,13 +203,13 @@ def handle_chat_submit(message, history, system_msg, model_name, max_tokens, tem
     # Stream the assistant response token by token
     assistant_response = ""
     for partial_response in response_generator:
-        assistant_response = render_with_reasoning_toggle(partial_response, bool(show_reasoning))
         # Update history with the current partial response and yield it
         current_history = history + [{"role": "assistant", "content": assistant_response}]
         yield current_history, ""
-def handle_chat_retry(history, system_msg, model_name, max_tokens, temperature, top_p, show_reasoning=False, hf_token: gr.OAuthToken = None, retry_data=None):
     """
     Retry the assistant response for the selected message.
     Works with gr.Chatbot.retry() which provides retry_data.index for the message.
@@ -275,6 +275,6 @@ def handle_chat_retry(history, system_msg, model_name, max_tokens, temperature,
     assistant_response = ""
     for partial_response in response_generator:
-        assistant_response = render_with_reasoning_toggle(partial_response, bool(show_reasoning))
         current_history = trimmed_history + [{"role": "assistant", "content": assistant_response}]
         yield current_history

         yield format_error_message("Unexpected Error", f"An unexpected error occurred: {error_msg}")
+def handle_chat_submit(message, history, system_msg, model_name, max_tokens, temperature, top_p, hf_token: gr.OAuthToken = None):
     """
     Handle chat submission and manage conversation history with streaming.
     """
     # Stream the assistant response token by token
     assistant_response = ""
     for partial_response in response_generator:
+        assistant_response = render_with_reasoning_toggle(partial_response, True)
         # Update history with the current partial response and yield it
         current_history = history + [{"role": "assistant", "content": assistant_response}]
         yield current_history, ""
+def handle_chat_retry(history, system_msg, model_name, max_tokens, temperature, top_p, hf_token: gr.OAuthToken = None, retry_data=None):
     """
     Retry the assistant response for the selected message.
     Works with gr.Chatbot.retry() which provides retry_data.index for the message.
     assistant_response = ""
     for partial_response in response_generator:
+        assistant_response = render_with_reasoning_toggle(partial_response, True)
         current_history = trimmed_history + [{"role": "assistant", "content": assistant_response}]
         yield current_history

ui_components.py CHANGED Viewed

@@ -52,11 +52,6 @@ def create_chat_tab(handle_chat_submit_fn, handle_chat_retry_fn=None):
                     lines=2,
                     placeholder="Define the assistant's personality and behavior..."
                 )
-                show_reasoning = gr.Checkbox(
-                    value=False,
-                    label="Show reasoning (<think>…</think>)",
-                    info="Reveal model's reasoning, if present",
-                )
             with gr.Column(scale=1):
                 chat_max_tokens = gr.Slider(
@@ -87,7 +82,7 @@ def create_chat_tab(handle_chat_submit_fn, handle_chat_retry_fn=None):
         chat_send_event = chat_submit.click(
             fn=handle_chat_submit_fn,
             inputs=[chat_input, chatbot_display, chat_system_message, chat_model_name,
-                   chat_max_tokens, chat_temperature, chat_top_p, show_reasoning],
             outputs=[chatbot_display, chat_input]
         )
@@ -102,7 +97,7 @@ def create_chat_tab(handle_chat_submit_fn, handle_chat_retry_fn=None):
         chat_enter_event = chat_input.submit(
             fn=handle_chat_submit_fn,
             inputs=[chat_input, chatbot_display, chat_system_message, chat_model_name,
-                   chat_max_tokens, chat_temperature, chat_top_p, show_reasoning],
             outputs=[chatbot_display, chat_input]
         )
@@ -124,7 +119,7 @@ def create_chat_tab(handle_chat_submit_fn, handle_chat_retry_fn=None):
             chatbot_display.retry(
                 fn=handle_chat_retry_fn,
                 inputs=[chatbot_display, chat_system_message, chat_model_name,
-                        chat_max_tokens, chat_temperature, chat_top_p, show_reasoning],
                 outputs=chatbot_display
             )

                     lines=2,
                     placeholder="Define the assistant's personality and behavior..."
                 )
             with gr.Column(scale=1):
                 chat_max_tokens = gr.Slider(
         chat_send_event = chat_submit.click(
             fn=handle_chat_submit_fn,
             inputs=[chat_input, chatbot_display, chat_system_message, chat_model_name,
+                   chat_max_tokens, chat_temperature, chat_top_p],
             outputs=[chatbot_display, chat_input]
         )
         chat_enter_event = chat_input.submit(
             fn=handle_chat_submit_fn,
             inputs=[chat_input, chatbot_display, chat_system_message, chat_model_name,
+                   chat_max_tokens, chat_temperature, chat_top_p],
             outputs=[chatbot_display, chat_input]
         )
             chatbot_display.retry(
                 fn=handle_chat_retry_fn,
                 inputs=[chatbot_display, chat_system_message, chat_model_name,
+                        chat_max_tokens, chat_temperature, chat_top_p],
                 outputs=chatbot_display
             )