SarmaHighOnCode
diff --git a/backend/app/api/routes/generate.py b/backend/app/api/routes/generate.py
Lines changed: 11 additions & 9 deletions
diff --git a/backend/app/main.py b/backend/app/main.py
Lines changed: 1 addition & 0 deletions
diff --git a/backend/app/ml/dataset.py b/backend/app/ml/dataset.py
Lines changed: 8 additions & 6 deletions
diff --git a/backend/app/ml/llm_engine.py b/backend/app/ml/llm_engine.py
Lines changed: 16 additions & 6 deletions
diff --git a/backend/app/ml/model.py b/backend/app/ml/model.py
Lines changed: 10 additions & 13 deletions
diff --git a/backend/app/ml/utils.py b/backend/app/ml/utils.py
Lines changed: 18 additions & 14 deletions
@@ -44,8 +44,7 @@ def _cleanup_old_jobs() -> None:
 
     now = time.monotonic()
     expired = [
-        jid for jid, job in _jobs.items()
-        if now - job.get("created_at", now) > _JOB_TTL_SECONDS
+        jid for jid, job in _jobs.items() if now - job.get("created_at", now) > _JOB_TTL_SECONDS
     ]
     for jid in expired:
         del _jobs[jid]
@@ -106,8 +105,7 @@ async def generate_handwriting(
     stream_url = f"{base_url}/api/stream/{job_id}"
 
     logger.info(
-        f"Job {job_id} created: {len(request_body.text)} chars, "
-        f"style={request_body.style_id}"
+        f"Job {job_id} created: {len(request_body.text)} chars, style={request_body.style_id}"
     )
 
     return GenerateResponse(
@@ -150,7 +148,9 @@ async def websocket_stream(websocket: WebSocket, job_id: str) -> None:
         return
 
     if not engine.is_ready:
-        await websocket.send_json({"type": "error", "message": "Engine not ready — model still loading"})
+        await websocket.send_json(
+            {"type": "error", "message": "Engine not ready — model still loading"}
+        )
         await websocket.close(code=4003)
         return
 
@@ -285,10 +285,12 @@ async def event_generator():
             job["status"] = "failed"
             job["error"] = str(e)
 
-            error_event = json.dumps({
-                "type": "error",
-                "message": str(e),
-            })
+            error_event = json.dumps(
+                {
+                    "type": "error",
+                    "message": str(e),
+                }
+            )
             yield f"data: {error_event}\n\n"
 
     return StreamingResponse(
 
@@ -33,6 +33,7 @@
 # Lifespan — Load model ONCE on startup, release on shutdown
 # ============================================================
 
+
 @asynccontextmanager
 async def lifespan(app: FastAPI) -> AsyncGenerator[None, None]:
     """
 
@@ -132,11 +132,13 @@ def _load_from_stroke_files(self, split: str) -> list[dict]:
                 else:
                     text_str = str(text_val)
 
-                samples.append({
-                    "strokes": data["strokes"].tolist(),
-                    "text": text_str,
-                    "writer_id": writer_id,
-                })
+                samples.append(
+                    {
+                        "strokes": data["strokes"].tolist(),
+                        "text": text_str,
+                        "writer_id": writer_id,
+                    }
+                )
             except Exception:
                 # Skip files that cannot be loaded without pickle or have other errors
                 continue
@@ -344,7 +346,7 @@ def parse_iam_xml(xml_path: Path) -> list[tuple[float, float, int, int, int]]:
     for i, (x, y, pen_down) in enumerate(abs_points):
         dx = x - prev_x
         dy = y - prev_y
-        is_last = (i == len(abs_points) - 1)
+        is_last = i == len(abs_points) - 1
 
         if is_last:
             p1, p2, p3 = 0, 0, 1  # end-of-sequence
 
@@ -37,8 +37,10 @@
 # Engine Configuration
 # ============================================================
 
+
 class QuantizationMode(str, Enum):
     """Quantization strategy for model weights."""
+
     NONE = "fp16"
     INT8 = "int8"
     INT4 = "int4"
@@ -51,6 +53,7 @@ class EngineConfig:
     Maps directly to Settings fields — separated so the engine
     has no hard dependency on FastAPI/Pydantic.
     """
+
     model_name: str = "inkforge-lstm-mdn-v1"
     checkpoint_path: str = "checkpoints/lstm_mdn_v1_best.pt"
     device: str = "cpu"
@@ -66,6 +69,7 @@ class EngineConfig:
 @dataclass
 class EngineStatus:
     """Runtime status snapshot of the engine."""
+
     model_loaded: bool = False
     model_name: str = ""
     engine_backend: str = "mock"
@@ -87,6 +91,7 @@ class EngineStatus:
 # Singleton LLM Engine
 # ============================================================
 
+
 class LLMEngine:
     """
     Singleton engine that manages the lifecycle of the LSTM+MDN model.
@@ -179,10 +184,11 @@ async def initialize_model(self, config: EngineConfig) -> None:
             if config.device == "cuda":
                 try:
                     import torch
+
                     if torch.cuda.is_available():
                         self._gpu_name = torch.cuda.get_device_name(0)
                         self._vram_total_gb = round(
-                            torch.cuda.get_device_properties(0).total_memory / (1024 ** 3), 1
+                            torch.cuda.get_device_properties(0).total_memory / (1024**3), 1
                         )
                         logger.info(f"  → CUDA device found: {self._gpu_name}")
                         logger.info(f"  → Total VRAM: {self._vram_total_gb} GB")
@@ -272,6 +278,7 @@ async def shutdown(self) -> None:
             # Clear CUDA cache if available
             try:
                 import torch
+
                 if torch.cuda.is_available():
                     torch.cuda.empty_cache()
             except ImportError:
@@ -493,8 +500,12 @@ async def _stream_mock(
                 line_num += 1
 
             # Baseline drift (Exaggerated for visual awareness in mock mode)
-            global_drift = baseline_drift * 8.0 * math.sin(
-                2 * math.pi * line_num / max(total_words / 5.0, 3.0) + random.uniform(0, 0.5)
+            global_drift = (
+                baseline_drift
+                * 8.0
+                * math.sin(
+                    2 * math.pi * line_num / max(total_words / 5.0, 3.0) + random.uniform(0, 0.5)
+                )
             )
 
             char_x = cursor_x
@@ -543,7 +554,7 @@ async def _stream_mock(
                     char_x += dx
 
                     delay = config.stream_chunk_delay_ms / 1000.0
-                    delay *= random.uniform(0.2, 0.8) # faster for mock strokes
+                    delay *= random.uniform(0.2, 0.8)  # faster for mock strokes
                     await asyncio.sleep(delay)
 
             # Pen-up between words
@@ -580,8 +591,7 @@ async def _stream_mock(
         }
 
         logger.info(
-            f"[req-{request_id}] Complete (mock): "
-            f"{stroke_index} strokes, {line_num + 1} lines"
+            f"[req-{request_id}] Complete (mock): {stroke_index} strokes, {line_num + 1} lines"
         )
 
     # --------------------------------------------------------
 
@@ -89,7 +89,7 @@ def __init__(
         # Total per mixture: 6 parameters
         # Plus 3 pen state logits
         mdn_output_dim = num_mixtures * 6  # π, μx, μy, σx, σy, ρ
-        pen_state_dim = 3                  # p1, p2, p3
+        pen_state_dim = 3  # p1, p2, p3
 
         self.mdn_head = nn.Linear(hidden_dim, mdn_output_dim)
         self.pen_head = nn.Linear(hidden_dim, pen_state_dim)
@@ -163,18 +163,18 @@ def sample(
         # Each component has 6 params, total = M*6
         params = mdn_params.view(num_m, 6)
 
-        pi_logits = params[:, 0]          # Mixture weights (logits)
-        mu_x = params[:, 1]               # Mean x
-        mu_y = params[:, 2]               # Mean y
-        sigma_x = torch.exp(params[:, 3]) # Std x (exp to ensure positive)
-        sigma_y = torch.exp(params[:, 4]) # Std y
-        rho = torch.tanh(params[:, 5])    # Correlation (tanh to bound [-1, 1])
+        pi_logits = params[:, 0]  # Mixture weights (logits)
+        mu_x = params[:, 1]  # Mean x
+        mu_y = params[:, 2]  # Mean y
+        sigma_x = torch.exp(params[:, 3])  # Std x (exp to ensure positive)
+        sigma_y = torch.exp(params[:, 4])  # Std y
+        rho = torch.tanh(params[:, 5])  # Correlation (tanh to bound [-1, 1])
 
         # 2. Apply temperature
         # Scale mixture logits by 1/τ, scale sigmas by √τ
         pi = torch.softmax(pi_logits / temperature, dim=0)
-        sigma_x = sigma_x * (temperature ** 0.5)
-        sigma_y = sigma_y * (temperature ** 0.5)
+        sigma_x = sigma_x * (temperature**0.5)
+        sigma_y = sigma_y * (temperature**0.5)
 
         # 3. Sample mixture component from categorical distribution
         mixture_idx = torch.multinomial(pi, 1).item()
@@ -193,7 +193,7 @@ def sample(
         z2 = torch.randn(1).item()
 
         dx = mu_x_k + sigma_x_k * z1
-        dy = mu_y_k + sigma_y_k * (rho_k * z1 + (1 - rho_k ** 2) ** 0.5 * z2)
+        dy = mu_y_k + sigma_y_k * (rho_k * z1 + (1 - rho_k**2) ** 0.5 * z2)
 
         # 5. Sample pen state from Bernoulli
         pen_probs = torch.softmax(pen_logits / temperature, dim=0)
@@ -256,19 +256,16 @@ def __init__(self, style_dim: int = STYLE_DIM, input_channels: int = 1) -> None:
             nn.BatchNorm2d(32),
             nn.ReLU(inplace=True),
             nn.MaxPool2d(2, 2),
-
             # Block 2: 32 -> 64 channels
             nn.Conv2d(32, 64, kernel_size=3, padding=1),
             nn.BatchNorm2d(64),
             nn.ReLU(inplace=True),
             nn.MaxPool2d(2, 2),
-
             # Block 3: 64 -> 128 channels
             nn.Conv2d(64, 128, kernel_size=3, padding=1),
             nn.BatchNorm2d(128),
             nn.ReLU(inplace=True),
             nn.MaxPool2d(2, 2),
-
             # Block 4: 128 -> 256 channels
             nn.Conv2d(128, 256, kernel_size=3, padding=1),
             nn.BatchNorm2d(256),
 
@@ -32,18 +32,18 @@ def compute_mdn_loss(
         Scalar loss tensor.
     """
     batch_size, seq_len, _ = mdn_params.shape
-    num_m = num_mixtures # Renamed num_m to M for consistency with patch
+    num_m = num_mixtures  # Renamed num_m to M for consistency with patch
 
     # Reshape MDN params: [batch, seq, M*6] -> [batch, seq, M, 6]
     params = mdn_params.view(batch_size, seq_len, num_m, 6)
 
     # Extract parameters
-    pi_logits = params[:, :, :, 0]           # [batch, seq, M]
-    mu_x = params[:, :, :, 1]                # [batch, seq, M]
-    mu_y = params[:, :, :, 2]                # [batch, seq, M]
-    sigma_x_raw = params[:, :, :, 3]         # [batch, seq, M]
-    sigma_y_raw = params[:, :, :, 4]         # [batch, seq, M]
-    rho_raw = params[:, :, :, 5]             # [batch, seq, M]
+    pi_logits = params[:, :, :, 0]  # [batch, seq, M]
+    mu_x = params[:, :, :, 1]  # [batch, seq, M]
+    mu_y = params[:, :, :, 2]  # [batch, seq, M]
+    sigma_x_raw = params[:, :, :, 3]  # [batch, seq, M]
+    sigma_y_raw = params[:, :, :, 4]  # [batch, seq, M]
+    rho_raw = params[:, :, :, 5]  # [batch, seq, M]
 
     # Apply activations to ensure valid parameter ranges
     sigma_x = torch.exp(sigma_x_raw)
@@ -63,18 +63,18 @@ def compute_mdn_loss(
 
     dx = (target_x - mu_x) / sigma_x
     dy = (target_y - mu_y) / sigma_y
-    rho_sq = rho ** 2
+    rho_sq = rho**2
 
     # Avoid division by zero
     one_minus_rho_sq = (1 - rho_sq).clamp(min=1e-6)
 
-    z_val = dx ** 2 + dy ** 2 - 2 * rho * dx * dy # Corrected Z variable name from patch
+    z_val = dx**2 + dy**2 - 2 * rho * dx * dy  # Corrected Z variable name from patch
     log_gaussian = (
         -math.log(2 * math.pi)
-        - torch.log(sigma_x) # Changed from log_sigma_x
-        - torch.log(sigma_y) # Changed from log_sigma_y
+        - torch.log(sigma_x)  # Changed from log_sigma_x
+        - torch.log(sigma_y)  # Changed from log_sigma_y
         - 0.5 * torch.log(one_minus_rho_sq)
-        - z_val / (2 * one_minus_rho_sq) # Changed from Z to z_val
+        - z_val / (2 * one_minus_rho_sq)  # Changed from Z to z_val
     )  # [batch, seq, M]
 
     # Weighted sum using log-sum-exp: log(Σ π_k * N_k) = logsumexp(log π_k + log N_k)
@@ -86,7 +86,9 @@ def compute_mdn_loss(
     # Pen state loss: cross-entropy (target must be long/int64)
     pen_logits_flat = pen_logits.view(-1, 3)  # [batch*seq, 3]
     target_pen_flat = target_pen.long().view(-1)  # [batch*seq]
-    pen_loss = functional.cross_entropy(pen_logits_flat, target_pen_flat) # Corrected syntax from patch
+    pen_loss = functional.cross_entropy(
+        pen_logits_flat, target_pen_flat
+    )  # Corrected syntax from patch
 
     # Total loss
     total_loss = stroke_loss + pen_loss
@@ -176,7 +178,9 @@ def strokes_to_absolute(strokes: list[tuple[float, ...]]) -> list[tuple[float, f
     return absolute
 
 
-def absolute_to_strokes(points: list[tuple[float, float, int]]) -> list[tuple[float, float, int, int, int]]:
+def absolute_to_strokes(
+    points: list[tuple[float, float, int]],
+) -> list[tuple[float, float, int, int, int]]:
     """
     Convert absolute coordinates to relative stroke deltas.