Update app.py
app.py
CHANGED
@@ -9,6 +9,7 @@
 # Requirements (in requirements.txt):
 # gradio>=4.44.0
 # huggingface_hub>=0.24.0
+# spaces  # only needed if your Space hardware is ZeroGPU
 #
 # Space secrets needed:
 # - HUGGING_FACE_HUB_TOKEN or HF_TOKEN (token must allow using the selected provider/model)
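For reference, the requirements.txt these header comments describe would now read as follows (a sketch assembled from the comments themselves; this commit does not touch the file):

```text
gradio>=4.44.0
huggingface_hub>=0.24.0
# spaces  # uncomment only if the Space runs on ZeroGPU hardware
```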
@@ -25,6 +26,22 @@ from typing import Any, Dict, Iterable, List, Optional, Tuple
 import gradio as gr
 from huggingface_hub import MCPClient
 
+# -------------------------------------------------
+# Optional ZeroGPU shim (silences "No @spaces.GPU..." startup message)
+# -------------------------------------------------
+SPACES_ZERO_GPU = bool(os.environ.get("SPACE_ZERO_GPU", ""))  # HF sets this in ZeroGPU envs
+try:
+    import spaces  # type: ignore
+except Exception:
+    spaces = None  # not installed on CPU Spaces; harmless
+
+if spaces is not None:
+    @spaces.GPU  # this just lets ZeroGPU detect a GPU-capable function at startup
+    def _zero_gpu_probe():
+        # We don't actually need a GPU for this app (remote inference),
+        # but the decorated function's presence satisfies ZeroGPU's startup check.
+        return "ok"
+
 # ----------------------------
 # Configuration
 # ----------------------------
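Two notes on the shim: it assumes `os` is already imported higher up in app.py, and the new `SPACES_ZERO_GPU` flag is computed but never consulted, since the code keys only off whether `import spaces` succeeds. If you wanted the probe defined only on actual ZeroGPU hardware, a variant could gate on the flag as well (a sketch, not part of this commit):

```python
# Variant sketch: define the probe only when both the `spaces` package is
# importable AND the ZeroGPU env flag is set. Assumes, as the commit's own
# comment says, that HF sets SPACE_ZERO_GPU in ZeroGPU environments.
import os

spaces = None
if os.environ.get("SPACE_ZERO_GPU"):
    try:
        import spaces  # type: ignore
    except Exception:
        spaces = None

if spaces is not None:
    @spaces.GPU  # a decorated function is all ZeroGPU's startup check looks for
    def _zero_gpu_probe():
        return "ok"
```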
@@ -126,8 +143,7 @@ def _format_tool_log(log_lines: List[str]) -> str:
 def _format_citations(cites: List[Tuple[str, Optional[str]]]) -> str:
     if not cites:
         return "_No citations captured yet._"
-
-    last = cites[-12:]
+    last = cites[-12:]  # show recent
     lines = []
     for (label, url) in last:
         if url:
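For context, the function being patched plausibly renders each `(label, url)` pair as a Markdown bullet. A sketch of the full body consistent with the visible lines; everything past `if url:` is an assumption:

```python
from typing import List, Optional, Tuple

def _format_citations(cites: List[Tuple[str, Optional[str]]]) -> str:
    if not cites:
        return "_No citations captured yet._"
    last = cites[-12:]  # show recent
    lines = []
    for (label, url) in last:
        if url:
            lines.append(f"- [{label}]({url})")  # assumption: Markdown link
        else:
            lines.append(f"- {label}")
    return "\n".join(lines)
```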
@@ -170,7 +186,6 @@ async def stream_answer(
             ctype = chunk.get("type")
 
             if ctype == "tool_log":
-                # Example: {"type": "tool_log", "tool": "...", "status": "started/finished"}
                 name = chunk.get("tool", "tool")
                 status = chunk.get("status", "")
                 _append_log(tool_log, f"- {name} **{status}**")
@@ -183,7 +198,7 @@
                 yield {"delta": chunk.get("text", ""), "tool_log": _format_tool_log(tool_log), "citations": _format_citations(citations)}
 
             elif ctype == "tool_result":
-                #
+                # Capture a useful citation label and optional URL if present
                 tool_name = chunk.get("tool", "tool")
                 content = chunk.get("content")
                 url = None
@@ -214,7 +229,6 @@ async def stream_answer(
                 }
 
             else:
-                # Fallback if provider yields plain strings
                 yield {"delta": str(chunk), "tool_log": _format_tool_log(tool_log), "citations": _format_citations(citations)}
 
     except Exception as e:
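Taken together, the branches above imply that `stream_answer` consumes dict chunks of roughly these shapes (reconstructed from the handling code; the field values and the "text" type name are assumptions):

```python
# Chunk shapes the dispatch above appears to handle. The tool name and
# content fields are illustrative placeholders, not taken from the diff.
tool_log_chunk = {"type": "tool_log", "tool": "web_search", "status": "started"}
text_chunk = {"type": "text", "text": "partial answer..."}
tool_result_chunk = {
    "type": "tool_result",
    "tool": "web_search",
    "content": {"url": "https://example.com"},  # the handler mines this for a citation URL
}
# Any other chunk falls through to the final `else:` and is stringified into a delta.
```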
@@ -279,12 +293,10 @@ with gr.Blocks(fill_height=True) as demo:
         - tool activity
         - citations
         """
-        # Start a new assistant message for streaming
         history_msgs = (history_msgs or []) + [{"role": "user", "content": user_msg}]
         history_msgs.append({"role": "assistant", "content": ""})
         yield history_msgs, gr.update(value="_No tool activity yet._"), gr.update(value="_No citations captured yet._")
 
-        # Compose messages for LLM
         messages_for_llm = to_llm_messages(history_msgs[:-1], user_msg, style_choice)
 
         async for chunk in stream_answer(messages_for_llm, MODEL_ID, PROVIDER, HF_TOKEN):
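Because the handler yields a `(history, tool-log update, citations update)` triple on every chunk, it presumably drives three output components. A self-contained sketch of that wiring with dummy components; none of these names appear in the diff:

```python
# Hypothetical hookup; respond, msg_box, chatbot, style_dropdown, tools_md
# and cites_md are placeholder names, not from this commit.
import gradio as gr

async def respond(user_msg, history_msgs, style_choice):
    # Placeholder generator mirroring the real handler's 3-tuple yields.
    history_msgs = (history_msgs or []) + [{"role": "user", "content": user_msg}]
    history_msgs.append({"role": "assistant", "content": "..."})
    yield history_msgs, gr.update(value="_No tool activity yet._"), gr.update(value="_No citations captured yet._")

with gr.Blocks() as demo:
    chatbot = gr.Chatbot(type="messages")  # role/content dicts, as the handler builds
    tools_md = gr.Markdown("_No tool activity yet._")
    cites_md = gr.Markdown("_No citations captured yet._")
    style_dropdown = gr.Dropdown(["concise", "detailed"], value="concise", label="Style")
    msg_box = gr.Textbox(label="Message")
    msg_box.submit(respond, [msg_box, chatbot, style_dropdown], [chatbot, tools_md, cites_md])
```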
@@ -300,10 +312,10 @@ with gr.Blocks(fill_height=True) as demo:
 # ----------------------------
 # Gradio runtime (queue + launch)
 # ----------------------------
-#
+# Assign back for older Gradio versions.
 demo = demo.queue(max_size=32)
 
-# Always launch
+# Always launch on Spaces (banner lines about "local URL" are normal).
 demo.launch(
-    ssr_mode=False
+    ssr_mode=False  # if SSR gives you trouble; otherwise you can omit this
 )
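One compatibility note on the launch block: `ssr_mode` appears to be a Gradio 5 launch flag, while the header pins only `gradio>=4.44.0`, so an older 4.x environment could reject the argument. A defensive sketch, if you want to keep the loose pin:

```python
# Sketch: pass ssr_mode only when the installed Gradio supports it.
import inspect

import gradio as gr

with gr.Blocks() as demo:
    gr.Markdown("placeholder")  # stands in for the real UI

launch_kwargs = {}
if "ssr_mode" in inspect.signature(gr.Blocks.launch).parameters:
    launch_kwargs["ssr_mode"] = False  # skip SSR; it has caused issues on some Spaces

demo.queue(max_size=32)
demo.launch(**launch_kwargs)
```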
|