11 changes: 10 additions & 1 deletion backend/backend/application/context/chat_ai_context.py
@@ -326,9 +326,18 @@ def _process_completed(self, *args, **kwargs):
# On successful completion, close the event thread
raise StopIteration

def _process_chat_intent(self, *args, **kwargs):
send_socket_message(
sid=kwargs["sid"],
channel_id=kwargs["channel_id"],
chat_id=kwargs["chat_id"],
chat_message_id=kwargs["chat_message_id"],
chat_intent_name=kwargs.get("chat_intent"),
)

def process_event(self, *args, **kwargs):
supported_events = ["thought_chain", "prompt_response",
"summary", "chat_name", "completed"]
"summary", "chat_name", "completed", "chat_intent"]
event_type = kwargs.get("event_type")
if event_type not in supported_events:
raise ValueError(f"Unsupported event type: {event_type}")
12 changes: 2 additions & 10 deletions backend/backend/application/context/chat_message_context.py
@@ -144,37 +144,30 @@ def persist_prompt(
llm_model_architect: str,
llm_model_developer: str,
generated_chat_res_id: str = None,
chat_intent_id: str = None,
chat_id: str = None,
user=None,
) -> ChatMessage:
"""
Create a new prompt within a Chat. If chat_id is None, create a new Chat.
Return the chat_message_id of the newly created ChatMessage.
chat_intent is left null here; the AI service auto-detects it and the
backend persists it on the message when the response arrives.
"""
if not prompt.strip():
raise InvalidChatPrompt()

chat_intent = None
transformation_type = 'TRANSFORM' if discussion_type == 'GENERATE' else 'DISCUSSION'
if chat_intent_id:
try:
chat_intent = ChatIntent.objects.get(chat_intent_id=chat_intent_id)
except ChatIntent.DoesNotExist:
chat_intent = None

if not chat_id:
chat = Chat.objects.create(
project=self.project_instance,
chat_name="Untitled Chat",
chat_intent=chat_intent,
llm_model_architect=llm_model_architect,
llm_model_developer=llm_model_developer,
user=user,
)
else:
chat = self._get_chat_or_raise(chat_id=chat_id, must_be_active=True)
chat.chat_intent = chat_intent
chat.llm_model_architect = llm_model_architect
chat.llm_model_developer = llm_model_developer
chat.discussion_type = discussion_type
@@ -185,7 +178,6 @@ def persist_prompt(
chat_message = ChatMessage.objects.create(
chat=chat,
prompt=prompt,
chat_intent=chat_intent,
llm_model_architect=llm_model_architect,
llm_model_developer=llm_model_developer,
discussion_type= discussion_type,
64 changes: 48 additions & 16 deletions backend/backend/application/context/llm_context.py
@@ -1,6 +1,6 @@
import json
import logging
from typing import Any
from typing import Any, Optional

import eventlet
import redis
@@ -52,12 +52,47 @@ def create_redis_xgroup(self, channel_id, group_id):
else:
raise

def _resolve_chat_intent(self, chat_message_id: str, data: dict, content: Any) -> Optional[str]:
"""
Pull the AI-detected chat_intent out of the inbound payload and persist it
to ChatMessage.chat_intent the first time we see it for a given message.
Subsequent events re-use the cached value.
"""
if not hasattr(self, "_chat_intent_by_msg"):
self._chat_intent_by_msg = {}
Contributor comment:
Cleaner to initialize self._chat_intent_by_msg = {} in __init__ rather than lazy-init via hasattr. If LLMServerContext is ever pooled or reused across requests (the rest of the class is stateful enough that this seems plausible), this dict carries entries across requests because there's no reset point. An explicit init in __init__ makes the lifecycle obvious.
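
A minimal sketch of that fix (assuming the class defines its own __init__; the real constructor signature isn't shown in this diff):

class LLMServerContext:
    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        # One intent cache per instance; the reset point is instance creation.
        self._chat_intent_by_msg: dict[str, str] = {}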


cached = self._chat_intent_by_msg.get(chat_message_id)
if cached:
return cached

intent_name = data.get("chat_intent")
if not intent_name and isinstance(content, dict):
intent_name = content.get("chat_intent")
if not intent_name:
return None

try:
from backend.core.models.chat_intent import ChatIntent
from backend.core.models.chat_message import ChatMessage
Contributor comment:
These imports run on every stream event (the helper is invoked from process_message for all event types, not just chat_intent). Python's import cache makes the cost small but non-zero, and there's no circular-import excuse here — both modules are already imported at top level elsewhere. Hoist them to the top of the file.
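
The hoisted form, for reference (same modules the helper already imports):

# at the top of llm_context.py, next to the existing imports
from backend.core.models.chat_intent import ChatIntent
from backend.core.models.chat_message import ChatMessage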

chat_intent = ChatIntent.objects.get(name=intent_name)
chat_message = ChatMessage.objects.get(chat_message_id=chat_message_id)
chat_message.chat_intent = chat_intent
chat_message.save(update_fields=["chat_intent"])
# Mirror the pre-PR behavior where Chat.chat_intent tracked the
# latest message's intent (used by PastConversations badge).
chat_message.chat.chat_intent = chat_intent
chat_message.chat.save(update_fields=["chat_intent"])
except Exception as e:
logging.error(f"Failed to persist chat_intent={intent_name}: {e}")
Contributor comment:
Bare except Exception masks distinct failure modes.

This catches ChatIntent.DoesNotExist (typo / unseeded value), OperationalError (transient DB), IntegrityError, and so on, all the same way. The frontend then renders a response with no Apply / Run SQL footer (because Conversation.jsx returns null when chat_intent_name is missing), and the only signal is a single logging.error line. For something that controls billing routing and the primary CTA on every AI response, that's too quiet — narrow the except, and at minimum emit a Sentry event or metric so we notice when the AI starts sending an unknown intent name.

See companion comment on the line below for the cache-write-outside-try issue, which compounds this.


self._chat_intent_by_msg[chat_message_id] = intent_name
Contributor comment (greptile-apps[bot] marked this conversation as resolved):
Cache write outside the try — silently locks in failure.

If the ChatIntent.objects.get / chat_message.save block above raises, the bare except Exception swallows it and we still reach this line and record intent_name in the cache. Subsequent events on the same stream then short-circuit on the cached value, never retrying the persist. Meanwhile the socket push in chat_ai_context._process_chat_intent still sends the name to the frontend (it reads kwargs["chat_intent"], which is the cached return value), so the UI shows the intent during streaming but the DB row stays null forever — historical reload is then inconsistent with what the user just saw.

Move the cache write into the try block (after the save), and narrow the except so ChatIntent.DoesNotExist (typo / unseeded value) doesn't get conflated with transient OperationalErrors.

Suggested shape:

try:
    chat_intent_obj = ChatIntent.objects.get(name=intent_name)
except ChatIntent.DoesNotExist:
    logging.error(f"Unknown chat_intent name from AI: {intent_name!r}")
    return None  # don't cache; let a later event try again

try:
    with transaction.atomic():
        ChatMessage.objects.filter(chat_message_id=chat_message_id) \
            .update(chat_intent=chat_intent_obj)
        Chat.objects.filter(chat_messages__chat_message_id=chat_message_id) \
            .update(chat_intent=chat_intent_obj)
except DatabaseError:
    logging.exception("Failed to persist chat_intent")
    return None

self._chat_intent_by_msg[chat_message_id] = intent_name
return intent_name

return intent_name

def process_message(
self,
sid: str,
channel_id: str,
chat_id: str,
chat_intent: str,
payload: dict[str, Any],
discussion_status: str
):
@@ -75,6 +110,7 @@
2: "summary",
3: "chat_name",
4: "completed",
5: "chat_intent",
99: "stop",
}

@@ -83,6 +119,8 @@
chat_message_id = data["chat_message_id"]
content = data["content"]

chat_intent = self._resolve_chat_intent(chat_message_id, data, content)
Contributor comment:
Retry no longer signals "this is a retry" to the AI gatekeeper.

Pre-PR, the is_retry branch in process_prompt set chat_intent = ChatMessageStatus.TRANSFORM_RETRY and forwarded it in llm_payload. Post-PR the assignment is gone and chat_intent is no longer in the outbound payload at all (see process_prompt below). The AI gatekeeper now classifies the retry prompt — which is literally "Faulty yaml: <yaml> \n Error: <error>" — from scratch. There's a real chance it routes that to SQL or INFO instead of TRANSFORM, breaking retry.

A second, related concern: when the gatekeeper does classify the retry, the new CHAT_INTENT event will hit this _resolve_chat_intent and overwrite ChatMessage.chat_intent. If the new classification differs from the original message's intent, the row's intent flips on retry — surprising for anyone reading historical data, and it breaks the ResponseFooter rendering for the original message.

Mitigations (pick one):

  • Keep an explicit is_retry: True field in llm_payload and have the AI side short-circuit the gatekeeper when it's set
  • Or have _resolve_chat_intent not overwrite ChatMessage.chat_intent once it's already set (sketched below)
  • Either way, add retry coverage to the test plan — there's none right now
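
A minimal sketch of the second mitigation (model fields taken from this diff; the FK id accessor is standard Django):

# inside _resolve_chat_intent, before persisting
chat_message = ChatMessage.objects.get(chat_message_id=chat_message_id)
if chat_message.chat_intent_id is not None:
    # Intent already persisted (e.g. the original message of a retry);
    # don't let a re-classification overwrite it.
    return chat_message.chat_intent.name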


if event_type == "chat_name":
self.chat_name = data["content"]
self.persist_response(
@@ -120,7 +158,7 @@ def _validate_message(self, group_id, channel_id):
)
return messages

def _handle_redis_message(self, sid, channel_id, chat_id, chat_intent, group_id, messages, discussion_status: str):
def _handle_redis_message(self, sid, channel_id, chat_id, group_id, messages, discussion_status: str):
for _, msg_list in messages:
for message_id, payload in msg_list:
logging.info(f" === Message ID: {message_id} ===")
Expand All @@ -129,7 +167,6 @@ def _handle_redis_message(self, sid, channel_id, chat_id, chat_intent, group_id,
sid=sid,
channel_id=channel_id,
chat_id=chat_id,
chat_intent=chat_intent,
payload=payload,
discussion_status=discussion_status
)
Expand All @@ -138,7 +175,7 @@ def _handle_redis_message(self, sid, channel_id, chat_id, chat_intent, group_id,
self.redis_client.xack(channel_id, group_id, message_id)

def __stream_listener(
self, sid: str, channel_id: str, chat_id: str, chat_message_id: str, chat_intent: str, group_id: str, discussion_status: str
self, sid: str, channel_id: str, chat_id: str, chat_message_id: str, group_id: str, discussion_status: str
):

while True:
Expand All @@ -148,7 +185,7 @@ def __stream_listener(
if not messages:
continue

self._handle_redis_message(sid, channel_id, chat_id, chat_intent, group_id, messages, discussion_status)
self._handle_redis_message(sid, channel_id, chat_id, group_id, messages, discussion_status)

except redis.exceptions.RedisError as e:
logging.error(f"[REDIS ERROR] {e}")
@@ -196,15 +233,15 @@ def __stream_listener(
)
break

def listen_to_redis_stream(self, sid: str, channel_id: str, chat_id: str, chat_message_id: str, chat_intent: str, discussion_status: str):
def listen_to_redis_stream(self, sid: str, channel_id: str, chat_id: str, chat_message_id: str, discussion_status: str):
"""Listens to the Redis stream from llm server and processes the messages."""
group_id = f"group_{chat_id}_{chat_message_id}"
self.create_redis_xgroup(channel_id, group_id)
self.__stream_listener(sid, channel_id, chat_id, chat_message_id, chat_intent, group_id, discussion_status)
self.__stream_listener(sid, channel_id, chat_id, chat_message_id, group_id, discussion_status)

def stream_prompt_response(self, sid: str, channel_id: str, chat_id: str, chat_message_id: str, chat_intent: str, discussion_status: str):
def stream_prompt_response(self, sid: str, channel_id: str, chat_id: str, chat_message_id: str, discussion_status: str):
"""Starts a background thread to listen redis pubsub channel from AI server"""
args = (sid, channel_id, chat_id, chat_message_id, chat_intent, discussion_status)
args = (sid, channel_id, chat_id, chat_message_id, discussion_status)
try:
sio.start_background_task(self.listen_to_redis_stream, *args)
except Exception as e:
@@ -237,12 +274,10 @@ def process_prompt(self, sid: str, channel_id: str, chat_id: str, chat_message_i
"GENERATE": ChatMessageStatus.GENERATE,
}
if is_retry:
chat_intent = ChatMessageStatus.TRANSFORM_RETRY
prompt = (
f"Faulty yaml:{chat_message.technical_content} \n Error:{chat_message.transformation_error_message}"
)
else:
chat_intent = chat_message.chat_intent.name
prompt = chat_message.prompt

if discussion_status in DISCUSSION_STATUS_MAP:
@@ -311,7 +346,6 @@ def process_prompt(self, sid: str, channel_id: str, chat_id: str, chat_message_i
"db_map": db_metadata,
"visitran_model": visitran_models,
"chat_name": chat_name,
"chat_intent": chat_intent,
"db_type": self.project_instance.database_type,
"llm_model_architect": chat_message.llm_model_architect,
"llm_model_developer": chat_message.llm_model_developer,
@@ -335,7 +369,6 @@ def process_prompt(self, sid: str, channel_id: str, chat_id: str, chat_message_i
channel_id=channel_id,
chat_id=chat_id,
chat_message_id=chat_message_id,
chat_intent=chat_intent,
discussion_status=chat_message.discussion_type,
)

@@ -347,10 +380,9 @@ def process_prompt(self, sid: str, channel_id: str, chat_id: str, chat_message_i
channel_id=channel_id,
chat_id=chat_id,
chat_message_id=chat_message_id,
chat_intent=chat_intent,
discussion_status=chat_message.discussion_type,
)
logging.info(f"process_prompt: chat_intent={chat_intent}, sid={sid}, channel_id={channel_id}")
logging.info(f"process_prompt: sid={sid}, channel_id={channel_id}")
Contributor comment:
Likely billing bug — TRANSFORM may be double-charged in non-WS mode.

In the cloud override of process_prompt (pluggable_apps/subscriptions/context.py), right after super().process_prompt(...) returns we do:

chat_intent = chat_message.chat_intent.name if chat_message.chat_intent else "INFO"
if chat_intent != "TRANSFORM":
    self.consume_tokens(...)

In this (non-WS) branch the Redis stream listener is started after send_event_to_llm_server(...) returns, so when super().process_prompt returns the listener has just begun and chat_message.chat_intent is still None. That falls through to "INFO" != "TRANSFORM" → consume_tokens() runs at generation. Then transformation_save charges again on Apply success. Net: every TRANSFORM in non-WS mode is charged twice.

WS mode probably happens to work because eventlet yields on Redis I/O and the listener drains in time, but relying on yield ordering for billing correctness is brittle.

Fix options, in order of preference:

  1. Have the AI side guarantee CHAT_INTENT (event_type=5) is the first event, and drain it synchronously inside process_prompt before returning → no race in either mode.
  2. Move the cloud-side consume_tokens decision to a hook fired from _resolve_chat_intent (i.e. when intent is known), not from process_prompt's return path.
  3. At minimum, make the cloud override re-fetch and skip charging when chat_intent is still null (defer to Apply or to a later event), rather than defaulting to "INFO" (sketched below).

The test plan claims billing was verified — please add an explicit non-WS test before merge.
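
A sketch of option 3 (the surrounding override code is assumed from the excerpt above):

chat_message.refresh_from_db(fields=["chat_intent"])
if chat_message.chat_intent is None:
    # Intent not resolved yet: defer charging to Apply or a later event
    # rather than defaulting to INFO and double-charging TRANSFORM.
    pass
elif chat_message.chat_intent.name != "TRANSFORM":
    self.consume_tokens(...)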

chat_message = self._get_chat_message(chat_id=chat_id, chat_message_id=chat_message_id)

return chat_message
4 changes: 4 additions & 0 deletions backend/backend/core/routers/chat/serializers.py
@@ -5,6 +5,9 @@

class ChatSerializer(serializers.ModelSerializer):
user = UserMinimalSerializer(read_only=True)
chat_intent_name = serializers.CharField(
source='chat_intent.display_name', read_only=True, default=None
Contributor comment:
Same field name (chat_intent_name), different source from the chat-message serializer:

  • here: source='chat_intent.display_name' → e.g. "Transform"
  • in chat_message_serializer.py:14: source='chat_intent.name' → e.g. "TRANSFORM"

The rationale (chat list shows the human label, message-level needs the canonical token for branching) is fine, but the asymmetry under one shared field name is undocumented and a future bug magnet — anyone wiring up a new component will assume both return the same thing. Either rename the chat-list one to chat_intent_label (or similar; sketched below) or pick a single source and have the frontend map for display.
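
The rename option, sketched against the field added in this diff:

chat_intent_label = serializers.CharField(
    source='chat_intent.display_name', read_only=True, default=None
)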

)

class Meta:
model = Chat
@@ -13,6 +16,7 @@ class Meta:
'project_id',
'chat_name',
'chat_intent',
'chat_intent_name',
'created_at',
'modified_at',
'is_deleted',
19 changes: 5 additions & 14 deletions backend/backend/core/routers/chat/views.py
@@ -128,7 +128,6 @@ def persist_prompt(self, request: Request, project_id: str, *args, **kwargs) ->
data = request.data
chat_id = data.get("chat_id")
prompt = data.get("prompt")
chat_intent_id = data.get("chat_intent_id")
llm_model_architect = data.get("llm_model_architect")
llm_model_developer = data.get("llm_model_developer")
discussion_type = data.get('discussion_status')
@@ -139,26 +138,19 @@
if discussion_type == "GENERATE":
generated_chat_res_id = data.get('final_discussion_id')

# Check token balance before processing the request
# Check token balance before processing the request.
# Intent is auto-detected by the AI service, so we don't know it yet —
# check against the worst-case (TRANSFORM) cost to avoid letting through
# a request the org can't afford.
try:
project = ProjectDetails.objects.get(project_uuid=project_id)
organization = project.organization

# Determine chat intent name for token calculation
chat_intent_name = "INFO" # Default
if chat_intent_id:
from backend.core.models.chat_intent import ChatIntent
try:
chat_intent = ChatIntent.objects.get(chat_intent_id=chat_intent_id)
chat_intent_name = chat_intent.name
except ChatIntent.DoesNotExist:
pass

self.fetch_token_balance(
llm_model_architect=llm_model_architect,
llm_model_developer=llm_model_developer,
organization=organization,
chat_intent_name=chat_intent_name
chat_intent_name="TRANSFORM"
)

except ProjectDetails.DoesNotExist:
@@ -172,7 +164,6 @@ def persist_prompt(self, request: Request, project_id: str, *args, **kwargs) ->
chat_message = chat_message_context.persist_prompt(
prompt=prompt,
chat_id=chat_id,
chat_intent_id=chat_intent_id,
llm_model_architect=llm_model_architect,
llm_model_developer=llm_model_developer,
discussion_type=discussion_type,
chat_message_serializer.py
@@ -11,6 +11,7 @@ class Meta:

class ChatMessageSerializer(serializers.ModelSerializer):
user = UserMinimalSerializer(read_only=True)
chat_intent_name = serializers.CharField(source='chat_intent.name', read_only=True, default=None)
Contributor comment:
See companion comment on chat/serializers.py:9. This one returns chat_intent.name ("TRANSFORM") while the chat-list serializer returns chat_intent.display_name ("Transform") under the same field name. Worth disambiguating.


class Meta:
model = ChatMessage
@@ -29,6 +30,7 @@ class Meta:
'transformation_status',
'transformation_error_message',
'chat_intent',
'chat_intent_name',
'llm_model_architect',
'llm_model_developer',
'created_at',
1 change: 1 addition & 0 deletions backend/backend/core/web_socket.py
@@ -263,6 +263,7 @@ def send_socket_message(sid, channel_id, **kwargs):
"is_retry_transform",
"discussion_status",
"token_usage_data", # Add token usage data
"chat_intent_name",
]

unsupported_args = [arg for arg in kwargs.keys() if arg not in allowed_args]
8 changes: 3 additions & 5 deletions frontend/src/ide/chat-ai/ActionButtons.jsx
@@ -25,7 +25,6 @@ const INFO_APPROVED =
const ActionButtons = memo(function ActionButtons({
chatMessageId,
savePrompt,
selectedChatIntent,
isLatestTransform,
uiAction,
message,
@@ -101,12 +100,12 @@
setTimeout(() => setIsOperationInProgress(false), 3000);

if (value === "GENERATE") {
savePrompt?.(label, selectedChatIntent, false, value, chatMessageId);
savePrompt?.(label, false, value, chatMessageId);
return;
}
savePrompt?.(label, selectedChatIntent, false, value);
savePrompt?.(label, false, value);
},
[savePrompt, selectedChatIntent, chatMessageId, isOperationInProgress]
[savePrompt, chatMessageId, isOperationInProgress]
);

const onApplyClick = useCallback(() => {
@@ -321,7 +320,6 @@ ActionButtons.displayName = "ActionButtons";
ActionButtons.propTypes = {
chatMessageId: PropTypes.string.isRequired,
savePrompt: PropTypes.func,
selectedChatIntent: PropTypes.string,
isLatestTransform: PropTypes.bool.isRequired,
uiAction: PropTypes.object,
message: PropTypes.object,