ChatFAQ
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 1 deletion b/‎.gitignore‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎Dogefile‎
Lines changed: 9 additions & 9 deletions b/‎Dogefile‎
Lines changed: 9 additions & 9 deletions
diff --git a/‎admin/nuxt.config.js‎
Lines changed: 3 additions & 0 deletions b/‎admin/nuxt.config.js‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎back/back/apps/broker/consumers/bots/custom_ws.py‎
Lines changed: 5 additions & 1 deletion b/‎back/back/apps/broker/consumers/bots/custom_ws.py‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎back/back/apps/broker/serializers/messages/custom_ws.py‎
Lines changed: 7 additions & 1 deletion b/‎back/back/apps/broker/serializers/messages/custom_ws.py‎
Lines changed: 7 additions & 1 deletion
diff --git a/‎back/back/apps/broker/views/__init__.py‎
Lines changed: 12 additions & 6 deletions b/‎back/back/apps/broker/views/__init__.py‎
Lines changed: 12 additions & 6 deletions
diff --git a/‎back/back/apps/health/checks.py‎
Lines changed: 157 additions & 42 deletions b/‎back/back/apps/health/checks.py‎
Lines changed: 157 additions & 42 deletions
diff --git a/‎back/back/apps/health/migrations/0001_initial.py‎
Lines changed: 1 addition & 2 deletions b/‎back/back/apps/health/migrations/0001_initial.py‎
Lines changed: 1 addition & 2 deletions
@@ -250,4 +250,5 @@ back/models/
 *.ipynb
 chat_rag/data/
 chat_rag/examples/
-*/.ragatouille/*
+*/.ragatouille/*
+/back/dump.rdb
@@ -113,15 +113,15 @@ workers:
     envs: [ sdk ]
     instance_size: XS
 
-#  - name: ray
-#    image:
-#      host: docker.io
-#      registry: chatfaq
-#      repository: back-chatrag
-#      tag: "develop"
-#    envs: [ django, ray_worker ]
-#    instance_size: L
-#    command: /.venv/bin/ray start --address=back:6375 --resources='{"tasks":100,"ai_components":100}' --block
+  - name: ray
+    image:
+      host: docker.io
+      registry: chatfaq
+      repository: back-chatrag
+      tag: "develop"
+    envs: [ django, ray_worker ]
+    instance_size: XXL
+    command: /.venv/bin/ray start --address=back:6375 --resources='{"tasks":100,"ai_components":100}' --block
 
 jobs:
   - name: migrate
 
@@ -23,6 +23,9 @@ export default envManager((env) => {
     });
     const viteNuxtConfig = defineNuxtConfig({
         ssr: true,
+        devServer: {
+            port: process.env.NUXT_PORT || 3000,
+        },
         css: ["@/assets/styles/global.scss"],
         buildModules: [],
         modules: [...config.modules, "@pinia/nuxt", "@element-plus/nuxt"],
 
@@ -27,7 +27,11 @@ async def gather_fsm_def(self):
         return fsm, None if fsm else f"`No FSM found with name {name}`"
 
     async def gather_user_id(self):
-        return self.scope["url_route"]["kwargs"]["sender_id"]
+        """
+        Return the sender identifier for this connection.
+
+        An authenticated ``scope["user"]`` takes precedence: its
+        ``sender_uuid`` is returned as a string. Otherwise the ``sender_id``
+        URL route kwarg is returned, which is ``None`` when the kwarg is
+        absent (the lookup uses ``.get`` and therefore does not raise).
+        """
+        # If user is authenticated, use their sender_uuid
+        if self.scope.get("user") and self.scope["user"].is_authenticated:
+            return str(self.scope["user"].sender_uuid)
+        # Otherwise, fall back to URL parameter
+        return self.scope["url_route"]["kwargs"].get("sender_id")
 
     async def gather_initial_conversation_metadata(self):
         params = parse_qs(self.scope["query_string"])
 
@@ -29,10 +29,16 @@ def to_mml(self, ctx: BotConsumer) -> Union[bool, "Message"]:
         if not self.is_valid():
             return False
 
+        sender_data = self.data["sender"].copy()
+
+        # If user is authenticated, use their sender_uuid as the sender ID
+        if ctx.scope.get("user") and ctx.scope["user"].is_authenticated:
+            sender_data["id"] = str(ctx.scope["user"].sender_uuid)
+
         s = MessageSerializer(
             data={
                 "stack": self.data["stack"],
-                "sender": self.data["sender"],
+                "sender": sender_data,
                 "send_time": int(time.time() * 1000),
                 "conversation": ctx.conversation.pk,
             }
 
@@ -100,13 +100,19 @@ def instance_permissions(self, request):
 
     @action(methods=("get",), detail=False, permission_classes=[AllowAny])
     def from_sender(self, request, *args, **kwargs):
-        if not request.query_params.get("sender"):
-            return JsonResponse(
-                {"error": "sender is required"},
-                status=400,
-            )
+        # Use authenticated user's sender_uuid if available, otherwise fall back to query param
+        if request.user.is_authenticated:
+            sender_id = str(request.user.sender_uuid)
+        else:
+            sender_id = request.query_params.get("sender")
+            if not sender_id:
+                return JsonResponse(
+                    {"error": "sender is required"},
+                    status=400,
+                )
+
         results = []
-        for c in Conversation.conversations_from_sender(request.query_params.get("sender")):
+        for c in Conversation.conversations_from_sender(sender_id):
             if error := self._instance_permissions(c, request):
                 return error
             results.append(ConversationSerializer(c).data)
 
@@ -1,18 +1,23 @@
-from collections.abc import Mapping, Sequence
+import contextlib
+import io
+import logging
+from typing import Mapping, Sequence
 
 from asgiref.sync import async_to_sync
 from django.conf import settings
 from health_check.cache.backends import CacheBackend
-from health_check.contrib.psutil.backends import MemoryUsage
 from health_check.db.backends import (
+    BaseHealthCheckBackend,
     DatabaseBackend,
     ServiceUnavailable,
-    BaseHealthCheckBackend,
 )
 
 from .base import DjangoHealthCheckWrapper, HealthCheck, Outcome, Status
 from .models import Event
 
+# Get a logger instance
+logger = logging.getLogger(__name__)
+
 
 def disp_window(window: Mapping[str, int]) -> str:
     """
@@ -104,41 +109,6 @@ def get_name(self) -> str:
         return "Database"
 
 
-class RamUsage(DjangoHealthCheckWrapper):
-    """
-    Checks that we don't use too much RAM
-    """
-
-    base_class = MemoryUsage
-
-    def get_name(self) -> str:
-        return "RAM Usage"
-
-    def get_resolving_actions(self, outcome: Outcome) -> str:
-        return """# __CODE__ &mdash; RAM usage is too high
-
-The memory usage in the container running the application is too high.
-
-## Possible causes
-
-- There is a memory leak in the application
-- The application just needs more RAM
-
-## Possible solutions
-
-- Short term, restart the container
-- Long term, identify if this issue comes from a leak (in which case you can
-  fix the leak) or if the application just needs more RAM (in which case you
-  can increase the RAM allocated to the container)
-"""
-
-    def suggest_reboot(self, outcome: Outcome) -> Sequence[str]:
-        return ["api"]
-
-
-# :: IF api__redis
-
-
 class Cache(DjangoHealthCheckWrapper):
     """
     Validates cache accessibility. Since the queue is also the cache, it will
@@ -172,9 +142,6 @@ def suggest_reboot(self, outcome: Outcome) -> Sequence[str]:
         return ["redis"]
 
 
-# :: ENDIF
-
-
 class ProcrastinateBuiltInHealthCheck(BaseHealthCheckBackend):
     """
     Health check for Procrastinate task processor.
@@ -201,8 +168,8 @@ def check_status(self):
         Use the built-in healthchecks to check if the Procrastinate app is
         working.
         """
-        from procrastinate.contrib.django.healthchecks import healthchecks
         from procrastinate import exceptions
+        from procrastinate.contrib.django.healthchecks import healthchecks
 
         try:
             async_to_sync(healthchecks)(app=self.app)
@@ -252,3 +219,151 @@ def get_resolving_actions(self, outcome: Outcome) -> str:
 
     def suggest_reboot(self, outcome: Outcome) -> Sequence[str]:
         return ["procrastinate_worker"]
+
+
+class ModuleSimulationBase(HealthCheck):
+    """
+    Base class for module simulation health checks.
+
+    The check does not run a simulation itself: it reads the ``Event``
+    objects of type ``module_<MODULE_NUMBER>_simulation`` that fall within
+    ``WINDOW`` and derives its status from their aggregated stats.
+
+    Subclasses are expected to set ``MODULE_NUMBER`` and ``MODULE_NAME``.
+    """
+
+    # Interpolated into the event type queried by get_status()
+    MODULE_NUMBER = None
+    # Human-readable module name, used in the check name and the help text
+    MODULE_NAME = None
+    # Keyword arguments forwarded to the Event `within()` filter and to
+    # disp_window() when building messages
+    WINDOW = dict(hours=7)
+
+    def get_name(self) -> str:
+        """Return the display name of the check, built from MODULE_NAME."""
+        return f"{self.MODULE_NAME} Simulation"
+
+
+    def get_status(self) -> Outcome:
+        """
+        Compute the status of the module simulation from the events of type
+        ``module_<MODULE_NUMBER>_simulation`` found within ``WINDOW``.
+
+        Returns:
+            An ``Outcome`` bound to this check whose status is:
+
+            - ``Status.ERROR`` when no event at all was found in the window,
+            - ``Status.ERROR`` when the stats report at least one failure,
+            - ``Status.OK`` otherwise.
+        """
+        event_type = f"module_{self.MODULE_NUMBER}_simulation"
+        stats = Event.objects.type(event_type).within(**self.WINDOW).stats()
+        stats_str = disp_stats(stats)
+
+        if stats["total"] == 0:
+            # No events found, means the task likely didn't run
+            outcome = dict(
+                status=Status.ERROR,
+                message=f"No simulation task events found in the last {disp_window(self.WINDOW)}",
+            )
+        elif stats["failure"]:
+            # Any failure within the window is reported as an error
+            outcome = dict(
+                status=Status.ERROR,
+                message=f"{stats_str} in the last {disp_window(self.WINDOW)}",
+            )
+        else:
+            outcome = dict(
+                status=Status.OK,
+                message=f"{stats_str} in the last {disp_window(self.WINDOW)}",
+            )
+
+        return Outcome(
+            instance=self,
+            **outcome,
+        )
+
+    def get_resolving_actions(self, outcome: Outcome) -> str:
+        """
+        Return the Markdown help text shown for a failing outcome.
+
+        The ``outcome`` argument is not used: the text only depends on
+        ``MODULE_NAME``.
+        """
+        # NOTE(review): `__CODE__` is presumably a placeholder substituted by
+        # the caller - confirm. The heading below mentions WARNING although
+        # get_status() in this class only produces ERROR or OK.
+        return f"""# __CODE__ &mdash; {self.MODULE_NAME} Simulation Task Failed or Delayed
+
+This check verifies the status of the last background task run for the {self.MODULE_NAME} simulation.
+The background task simulates a file generation via WebSocket to verify:
+- The WebSocket server is reachable.
+- The FSM works correctly.
+- The FastAPI modules server is reachable.
+- The file generation LLM is reachable.
+- The file storage is reachable.
+
+## Possible Causes for ERROR/WARNING:
+
+- **Network Connectivity:** Issues connecting to the WebSocket server, module server, LLM, or storage.
+- **Base File Missing:** The required input file (`health_check_files/...`) might be missing from storage.
+- **Module/FSM Logic Error:** An error within the specific module's logic or the FSM definition.
+- **Resource Exhaustion:** The simulation task might be timing out due to resource limits (CPU, RAM).
+- The LLM API keys might be invalid or the LLM provider is down.
+"""
+
+    def suggest_reboot(self, outcome: Outcome) -> Sequence[str]:
+        """Return the names of the services suggested for a reboot."""
+        return ["fsm", "module server"]
+
+
+class Module1Simulation(ModuleSimulationBase):
+    """
+    Health check for the simulated file generation with module 1 of the
+    chatbot, meant to verify that WebSocket connection, message processing and
+    file generation are working correctly.
+
+    The status is computed by ModuleSimulationBase from the events of type
+    ``module_1_simulation``.
+    """
+
+    # Selects the `module_1_simulation` event type in the base class
+    MODULE_NUMBER = 1
+    # Name displayed in the check name and in the help text
+    MODULE_NAME = "Info2ArticleXia"
+
+
+class Module2Simulation(ModuleSimulationBase):
+    """
+    Health check for the simulated file generation with module 2 of the
+    chatbot, meant to verify that WebSocket connection, message processing and
+    file generation are working correctly.
+
+    The status is computed by ModuleSimulationBase from the events of type
+    ``module_2_simulation``.
+    """
+
+    # Selects the `module_2_simulation` event type in the base class
+    MODULE_NUMBER = 2
+    # Name displayed in the check name and in the help text
+    MODULE_NAME = "TopicsIndexGenXia"
+
+
+class Module3Simulation(ModuleSimulationBase):
+    """
+    Health check for the simulated file generation with module 3 of the
+    chatbot, meant to verify that WebSocket connection, message processing and
+    file generation are working correctly.
+
+    The status is computed by ModuleSimulationBase from the events of type
+    ``module_3_simulation``.
+    """
+
+    # Selects the `module_3_simulation` event type in the base class
+    MODULE_NUMBER = 3
+    # Name displayed in the check name and in the help text
+    MODULE_NAME = "ColAgreeSumXia"
+
+
+class LLMCheck(HealthCheck):
+    """
+    Validates that the enabled LLMs are working correctly, based on the
+    ``llm_call_complete`` and ``llm_call_start`` events found within
+    ``WINDOW``.
+    """
+
+    # Keyword arguments forwarded to the Event `within()` filter and to
+    # disp_window() when building messages
+    WINDOW = dict(hours=1)
+
+    def get_name(self) -> str:
+        """Return the display name of the check."""
+        return "LLM Check"
+
+    def get_status(self) -> Outcome:
+        """
+        Compute the status from the LLM call events found within ``WINDOW``.
+
+        Returns:
+            An ``Outcome`` with ``Status.ERROR`` when the stats report at
+            least one failure (the ``data`` of every unsuccessful event is
+            attached under ``extra["errors"]``), ``Status.OK`` otherwise.
+        """
+        events = Event.objects.types(["llm_call_complete", "llm_call_start"]).within(
+            **self.WINDOW
+        )
+        stats = events.stats()
+        stats_str = disp_stats(stats)
+
+        # NOTE(review): there is no dedicated branch for an empty window here;
+        # with no failure reported the check falls through to OK.
+        if stats["failure"]:
+            # Collect the payload of each failed event for troubleshooting
+            errors = [e.data for e in events.filter(is_success=False)]
+            return Outcome(
+                instance=self,
+                status=Status.ERROR,
+                message=f"{stats_str} in the last {disp_window(self.WINDOW)}",
+                extra={"errors": errors},
+            )
+        else:
+            return Outcome(
+                instance=self,
+                status=Status.OK,
+                message=f"{stats_str} in the last {disp_window(self.WINDOW)}",
+            )
+
+    def get_resolving_actions(self, outcome: Outcome) -> str:
+        """
+        Return the Markdown help text shown for a failing outcome.
+
+        The ``outcome`` argument is not used: the text is static.
+        """
+        return """# __CODE__ &mdash; LLM failed
+
+This check validates that the enabled LLM are working correctly.
+
+## Possible causes
+
+- The API key is invalid.
+- The defined endpoint url is invalid.
+- The model provider is down.
+"""
+
+    def suggest_reboot(self, outcome: Outcome) -> Sequence[str]:
+        """Return an empty list: no service reboot is suggested."""
+        return []
@@ -1,10 +1,9 @@
-# Generated by Django 5.1.6 on 2025-02-21 23:49
+# Generated by Django 4.1.7 on 2023-12-12 14:17
 
 from django.db import migrations, models
 
 
 class Migration(migrations.Migration):
-
     initial = True
 
     dependencies = []