11import json
2+ import time
23import uuid
34from logging import getLogger
45from typing import Awaitable , Callable , Dict , List , Optional , Union
2930from chat_rag .llms import load_llm
3031from chat_rag .llms .types import Content , Message , ToolResult , ToolUse
3132
33+ from back .apps .health .models import Event
34+
3235logger = getLogger (__name__ )
3336
3437
@@ -198,6 +201,40 @@ async def resolve_references(reference_kis, retriever_config):
198201 }
199202
200203
async def log_llm_event(
    event_type: str,
    is_success: bool,
    data: dict,
):
    """
    Asynchronously persist an LLM-related event to the Event model.

    Parameters
    ----------
    event_type : str
        Type of event (e.g. 'llm_call_start', 'llm_call_complete',
        'llm_config_not_found').
    is_success : bool
        Whether the event represents a successful operation.
    data : dict
        JSON-serializable payload stored with the event. Callers typically
        include fields such as llm_call_id, llm_config_name,
        conversation_id, and timing information.
    """
    # Event.objects.create is a blocking ORM call; wrap it with
    # database_sync_to_async so it can be awaited without blocking the
    # event loop.
    await database_sync_to_async(Event.objects.create)(
        event_type=event_type,
        is_success=is_success,
        data=data,
    )
237+
201238async def query_llm (
202239 llm_config_name : str ,
203240 conversation_id : int ,
@@ -221,18 +258,20 @@ async def query_llm(
221258 # if the llm config is mistral then return an error that mistral is not supported yet
222259 if llm_config .llm_type == LLMChoices .MISTRAL .value :
223260 await error_handler ({
224- "payload" : {
225- "errors" : "Error: Mistral is temporarily unavailable. We're working to add support for it soon. For now, please select a different model like OpenAI." ,
226- "request_info" : {"llm_config_name" : llm_config_name },
227- }
228- })
261+ "errors" : "Error: Mistral is temporarily unavailable. We're working to add support for it soon. For now, please select a different model provider like OpenAI." ,
262+ "llm_config_name" : llm_config_name ,
263+ "conversation_id" : conversation_id
264+ },
265+ event_type = "llm_config_not_found"
266+ )
229267 except LLMConfig .DoesNotExist :
230268 await error_handler ({
231- "payload" : {
232269 "errors" : f"LLM config with name: { llm_config_name } does not exist." ,
233- "request_info" : {"llm_config_name" : llm_config_name },
234- }
235- })
270+ "llm_config_name" : llm_config_name ,
271+ "conversation_id" : conversation_id
272+ },
273+ event_type = "llm_config_not_found"
274+ )
236275 return
237276
238277 conv = await database_sync_to_async (Conversation .objects .get )(pk = conversation_id )
@@ -252,25 +291,28 @@ async def query_llm(
252291 messages = messages [1 :]
253292 elif not prev_messages :
254293 await error_handler ({
255- "payload" : {
256- "errors" : "Error: No previous messages and no messages provided." ,
257- "request_info" : {"conversation_id" : conversation_id },
258- }
259- })
294+ "errors" : "Error: No previous messages and no messages provided." ,
295+ "conversation_id" : conversation_id ,
296+ },
297+ )
260298 return
261299 if messages :
262300 new_messages .extend (messages )
263301 else :
264302 new_messages = messages
265303 if new_messages is None :
266304 await error_handler ({
267- "payload" : {
268- "errors" : "Error: No messages provided." ,
269- "request_info" : {"conversation_id" : conversation_id },
270- }
271- })
305+ "errors" : "Error: No messages provided." ,
306+ "conversation_id" : conversation_id ,
307+ },
308+ )
272309 return
273310
311+
312+ # Generate a unique ID for this LLM call
313+ llm_call_id = str (uuid .uuid4 ())
314+ start_time = time .perf_counter ()
315+
274316 try :
275317 # Decrypt the API key from the LLMConfig if available.
276318 api_key = None
@@ -288,6 +330,25 @@ async def query_llm(
288330 api_key = api_key ,
289331 )
290332
333+ await log_llm_event (
334+ event_type = "llm_call_start" ,
335+ is_success = True ,
336+ data = {
337+ "llm_call_id" : llm_call_id ,
338+ "llm_config_name" : llm_config_name ,
339+ "conversation_id" : conversation_id ,
340+ "temperature" : temperature ,
341+ "max_tokens" : max_tokens ,
342+ "seed" : seed ,
343+ "tools" : tools ,
344+ "tool_choice" : tool_choice ,
345+ "messages" : new_messages ,
346+ "schema" : response_schema ,
347+ "cache_config" : cache_config ,
348+ "stream" : stream ,
349+ }
350+ )
351+
291352 if response_schema :
292353 response_message = await llm .aparse (
293354 messages = new_messages ,
@@ -356,14 +417,28 @@ async def query_llm(
356417 "last_chunk" : True ,
357418 }
358419
420+ await log_llm_event (
421+ event_type = "llm_call_complete" ,
422+ is_success = True ,
423+ data = {
424+ "llm_call_id" : llm_call_id ,
425+ "duration_seconds" : time .perf_counter () - start_time ,
426+ }
427+ )
428+
359429 except Exception as e :
360- logger .error ( "Error during LLM query" , exc_info = e )
361- await error_handler ({
362- "payload" : {
430+ logger .exception ( f "Error during llm call: { e } " )
431+ await error_handler (
432+ {
363433 "errors" : "There was an error generating the response. Please try again or contact the administrator." ,
364- "request_info" : {"conversation_id" : conversation_id },
365- }
366- })
434+ "error_message" : str (e ),
435+ "llm_config_name" : llm_config_name ,
436+ "conversation_id" : conversation_id ,
437+ "llm_call_id" : llm_call_id ,
438+ "duration_seconds" : time .perf_counter () - start_time ,
439+ },
440+ event_type = "llm_call_complete" ,
441+ )
367442 return
368443
369444
@@ -449,6 +524,7 @@ async def process_llm_request(self, data):
449524
450525 lm_msg_id = str (uuid .uuid4 ())
451526 data = serializer .validated_data
527+
452528 async for chunk in query_llm (
453529 data ["llm_config_name" ],
454530 data ["conversation_id" ],
@@ -463,7 +539,7 @@ async def process_llm_request(self, data):
463539 data .get ("cache_config" ),
464540 data .get ("response_schema" ),
465541 data .get ("stream" ),
466- error_handler = self .error_response ,
542+ error_handler = self .llm_error_response ,
467543 ):
468544 await self .send (
469545 json .dumps (
@@ -555,9 +631,24 @@ async def process_prompt_request(self, data):
555631 }
556632 )
557633
558-
559-
560634 async def error_response (self , data : dict ):
561635 data ["status" ] = WSStatusCodes .bad_request .value
562636 data ["type" ] = RPCMessageType .error .value
563637 await self .send (json .dumps (data ))
638+
639+ async def llm_error_response (self , data : dict , event_type : str = None ):
640+ if event_type :
641+ await log_llm_event (
642+ event_type = event_type ,
643+ is_success = False ,
644+ data = data
645+ )
646+ # This is info sent to the SDK, so don't send a detailed error message for now.
647+ return await self .error_response (
648+ {
649+ "payload" : {
650+ "errors" : data ["errors" ],
651+ "request_info" : {"conversation_id" : data ["conversation_id" ], "llm_config_name" : data ["llm_config_name" ]},
652+ }
653+ }
654+ )
0 commit comments