Spaces:

RSHVR
/

Command_RTC

Sleeping

App Files Files Community

RSHVR committed on Jun 4

Commit

d8d34de

verified ·

1 Parent(s): aacbb48

Fix state and add concurrency

Browse files

State: Fixed issue where conversation history would persist across users and new chats
Concurrency: Added concurrency support using async

Files changed (1) hide show

app.py +25 -6

app.py CHANGED Viewed

@@ -4,8 +4,6 @@ import os
 import cohereAPI
-# Conversation history storage
-conversation_history = []
 # Model configurations
 COHERE_MODELS = [
@@ -33,9 +31,30 @@ def show_model_change_info(model_name):
     return model_name
-def respond(message, history, model_name="command-a-03-2025"):
     """Generate streaming response using Cohere API"""
-    global conversation_history
     # Get API key from environment
     api_key = os.getenv('COHERE_API_KEY')
@@ -49,9 +68,9 @@ def respond(message, history, model_name="command-a-03-2025"):
                         Do not repeat the user's question in your response. Do not exceed 50 words."""
     try:
-        # Use streaming function
         partial_message = ""
-        for chunk in cohereAPI.send_message_stream(
             system_message=system_message,
             user_message=message,
             conversation_history=conversation_history,

 import cohereAPI
 # Model configurations
 COHERE_MODELS = [
     return model_name
+async def respond(message, history, model_name="command-a-03-2025"):
     """Generate streaming response using Cohere API"""
+    # Convert Gradio history format to API format
+    conversation_history = []
+    if history:
+        for entry in history:
+            if isinstance(entry, dict):
+                # Clean dict format - only keep role and content
+                if "role" in entry and "content" in entry:
+                    conversation_history.append({
+                        "role": entry["role"],
+                        "content": entry["content"]
+                    })
+            elif isinstance(entry, (list, tuple)) and len(entry) == 2:
+                # Old format: [user_msg, assistant_msg]
+                user_msg, assistant_msg = entry
+                if user_msg:
+                    conversation_history.append({"role": "user", "content": str(user_msg)})
+                if assistant_msg:
+                    conversation_history.append({"role": "assistant", "content": str(assistant_msg)})
+            else:
+                # Handle other formats gracefully
+                continue
     # Get API key from environment
     api_key = os.getenv('COHERE_API_KEY')
                         Do not repeat the user's question in your response. Do not exceed 50 words."""
     try:
+        # Use async streaming function
         partial_message = ""
+        async for chunk in cohereAPI.send_message_stream_async(
             system_message=system_message,
             user_message=message,
             conversation_history=conversation_history,