From 61d16f6b8124936d0ce6861a4719fb8b9de0a2c0 Mon Sep 17 00:00:00 2001
From: Android PowerUser <88908510+Android-PowerUser@users.noreply.github.com>
Date: Mon, 30 Mar 2026 18:12:16 +0200
Subject: [PATCH 1/4] Adjust Mistral retry scheduling for per-key 1.1s cooldown

---
 .../multimodal/PhotoReasoningViewModel.kt     | 158 ++++++++++++------
 1 file changed, 111 insertions(+), 47 deletions(-)

diff --git a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
index 0f5cf0e..e4d62fd 100644
--- a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
+++ b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
@@ -70,6 +70,7 @@ import kotlinx.serialization.modules.subclass
 import com.google.ai.sample.webrtc.WebRTCSender
 import com.google.ai.sample.webrtc.SignalingClient
 import org.webrtc.IceCandidate
+import kotlin.math.max
 
 class PhotoReasoningViewModel(
     application: Application,
@@ -182,9 +183,11 @@ class PhotoReasoningViewModel(
     // to avoid re-executing already-executed commands
     private var incrementalCommandCount = 0
 
-    // Mistral rate limiting: track last request time to enforce 1-second minimum interval
-    private var lastMistralRequestTimeMs = 0L
-    private val MISTRAL_MIN_INTERVAL_MS = 1000L
+    // Mistral rate limiting per API key (1.1 seconds between requests with same key)
+    private val mistralNextAllowedRequestAtMsByKey = mutableMapOf<String, Long>()
+    private var lastMistralTokenTimeMs = 0L
+    private var lastMistralTokenKey: String? = null
+    private val MISTRAL_MIN_INTERVAL_MS = 1100L
 
     // Accumulated full text during streaming for incremental command parsing
     private var streamingAccumulatedText = StringBuilder()
@@ -1052,12 +1055,6 @@ private fun reasonWithMistral(
     resetStreamingCommandState()
 
     viewModelScope.launch(Dispatchers.IO) {
-        // Rate limiting: nur die verbleibende Zeit warten
-        val elapsed = System.currentTimeMillis() - lastMistralRequestTimeMs
-        if (lastMistralRequestTimeMs > 0 && elapsed < MISTRAL_MIN_INTERVAL_MS) {
-            delay(MISTRAL_MIN_INTERVAL_MS - elapsed)
-        }
-
         try {
             val currentModel = com.google.ai.sample.GenerativeAiViewModelFactory.getCurrentModel()
             val genSettings = com.google.ai.sample.util.GenerationSettingsPreferences.loadSettings(context, currentModel.modelName)
@@ -1126,60 +1123,127 @@ private fun reasonWithMistral(
                 .addHeader("Authorization", "Bearer $key")
                 .build()
 
-            var currentKey = initialApiKey
-            var response = client.newCall(buildRequest(currentKey)).execute()
-            lastMistralRequestTimeMs = System.currentTimeMillis()
+            val availableKeys = apiKeyManager.getApiKeys(ApiProvider.MISTRAL)
+                .filter { it.isNotBlank() }
+                .distinct()
+            if (availableKeys.isEmpty()) {
+                throw IOException("Mistral API key not found.")
+            }
 
-            if (response.code == 429) {
-                response.close()
-                apiKeyManager.markKeyAsFailed(currentKey, ApiProvider.MISTRAL)
-                val nextKey = apiKeyManager.switchToNextAvailableKey(ApiProvider.MISTRAL)
-                if (nextKey != null && nextKey != currentKey) {
-                    // Anderer Key verfugbar -> sofort wechseln wie bisher
-                    currentKey = nextKey
-                    val elapsed2 = System.currentTimeMillis() - lastMistralRequestTimeMs
-                    if (elapsed2 < MISTRAL_MIN_INTERVAL_MS) delay(MISTRAL_MIN_INTERVAL_MS - elapsed2)
-                    response = client.newCall(buildRequest(currentKey)).execute()
-                    lastMistralRequestTimeMs = System.currentTimeMillis()
-                } else {
-                    // Kein anderer Key -> 5 Sekunden lang sofort wiederholen
-                    apiKeyManager.resetFailedKeys(ApiProvider.MISTRAL)
+            fun markKeyCooldown(key: String, referenceTimeMs: Long) {
+                val nextAllowedAt = referenceTimeMs + MISTRAL_MIN_INTERVAL_MS
+                val existing = mistralNextAllowedRequestAtMsByKey[key] ?: 0L
+                mistralNextAllowedRequestAtMsByKey[key] = max(existing, nextAllowedAt)
+            }
+
+            fun remainingWaitForKeyMs(key: String, nowMs: Long): Long {
+                val nextAllowedAt = mistralNextAllowedRequestAtMsByKey[key] ?: 0L
+                return (nextAllowedAt - nowMs).coerceAtLeast(0L)
+            }
+
+            fun isRetryableMistralFailure(code: Int): Boolean {
+                return code == 429 || code >= 500
+            }
+
+            var response: okhttp3.Response? = null
+            var selectedKeyForResponse: String? = null
+            var consecutiveFailures = 0
+            var blockedKeysThisRound = mutableSetOf<String>()
+
+            while (response == null && consecutiveFailures < 5) {
+                if (stopExecutionFlag.get()) break
+
+                val now = System.currentTimeMillis()
+                val keyPool = availableKeys.filter { it !in blockedKeysThisRound }.ifEmpty {
+                    blockedKeysThisRound.clear()
+                    availableKeys
+                }
+
+                val keyWithLeastWait = keyPool.minByOrNull { remainingWaitForKeyMs(it, now) } ?: availableKeys.first()
+                val waitMs = remainingWaitForKeyMs(keyWithLeastWait, now)
+                if (waitMs > 0L) {
+                    delay(waitMs)
+                }
+
+                val selectedKey = keyWithLeastWait
+                selectedKeyForResponse = selectedKey
+
+                try {
+                    val attemptResponse = client.newCall(buildRequest(selectedKey)).execute()
+                    val requestEndMs = System.currentTimeMillis()
+                    markKeyCooldown(selectedKey, requestEndMs)
+
+                    if (attemptResponse.isSuccessful) {
+                        response = attemptResponse
+                        break
+                    }
+
+                    val isRetryable = isRetryableMistralFailure(attemptResponse.code)
+                    if (!isRetryable) {
+                        val errBody = attemptResponse.body?.string()
+                        attemptResponse.close()
+                        throw IllegalStateException("Mistral Error ${attemptResponse.code}: $errBody")
+                    }
+
+                    attemptResponse.close()
+                    blockedKeysThisRound.add(selectedKey)
+                    consecutiveFailures++
                     withContext(Dispatchers.Main) {
-                        replaceAiMessageText("Rate limit erreicht. Wiederhole...", isPending = true)
+                        replaceAiMessageText(
+                            "Mistral temporär nicht verfügbar (Versuch $consecutiveFailures/5). Wiederhole...",
+                            isPending = true
+                        )
                     }
-                    val retryDeadline = System.currentTimeMillis() + 5000L
-                    var retryResponse: okhttp3.Response? = null
-                    while (System.currentTimeMillis() < retryDeadline) {
-                        if (stopExecutionFlag.get()) break
-                        val retryResp = client.newCall(buildRequest(currentKey)).execute()
-                        lastMistralRequestTimeMs = System.currentTimeMillis()
-                        if (retryResp.code != 429) {
-                            retryResponse = retryResp
-                            break
-                        }
-                        retryResp.close()
+                } catch (e: IOException) {
+                    val requestEndMs = System.currentTimeMillis()
+                    markKeyCooldown(selectedKey, requestEndMs)
+                    blockedKeysThisRound.add(selectedKey)
+                    consecutiveFailures++
+                    if (consecutiveFailures >= 5) {
+                        throw IOException("Mistral request failed after 5 attempts: ${e.message}", e)
                     }
-                    if (retryResponse == null || stopExecutionFlag.get()) {
-                        throw IOException("Mistral rate limit: Kein Erfolg innerhalb von 5 Sekunden.")
+                    withContext(Dispatchers.Main) {
+                        replaceAiMessageText(
+                            "Mistral Netzwerkfehler (Versuch $consecutiveFailures/5). Wiederhole...",
+                            isPending = true
+                        )
                     }
-                    response = retryResponse
                 }
             }
 
-            if (!response.isSuccessful) {
-                val errBody = response.body?.string()
-                response.close()
-                throw IOException("Mistral Error ${response.code}: $errBody")
+            if (stopExecutionFlag.get()) {
+                throw IOException("Mistral request aborted.")
+            }
+
+            val finalResponse = response ?: throw IOException("Mistral request failed after 5 attempts.")
+
+            if (!finalResponse.isSuccessful) {
+                val errBody = finalResponse.body?.string()
+                finalResponse.close()
+                throw IOException("Mistral Error ${finalResponse.code}: $errBody")
             }
 
-            val body = response.body ?: throw IOException("Empty response body from Mistral")
+            val body = finalResponse.body ?: throw IOException("Empty response body from Mistral")
             val aiResponseText = openAiStreamParser.parse(body) { accText ->
+                selectedKeyForResponse?.let { key ->
+                    lastMistralTokenKey = key
+                    lastMistralTokenTimeMs = System.currentTimeMillis()
+                    markKeyCooldown(key, lastMistralTokenTimeMs)
+                }
                 withContext(Dispatchers.Main) {
                     replaceAiMessageText(accText, isPending = true)
                     processCommandsIncrementally(accText)
                 }
             }
-            response.close()
+            finalResponse.close()
+            selectedKeyForResponse?.let { key ->
+                val reference = if (lastMistralTokenKey == key && lastMistralTokenTimeMs > 0L) {
+                    lastMistralTokenTimeMs
+                } else {
+                    System.currentTimeMillis()
+                }
+                markKeyCooldown(key, reference)
+            }
 
             withContext(Dispatchers.Main) {
                 _uiState.value = PhotoReasoningUiState.Success(aiResponseText)

From 3cbeac1157ab1bb7e10293062b40670274576a0d Mon Sep 17 00:00:00 2001
From: Android PowerUser <88908510+Android-PowerUser@users.noreply.github.com>
Date: Mon, 30 Mar 2026 18:24:19 +0200
Subject: [PATCH 2/4] Update
 app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt

Co-authored-by: amazon-q-developer[bot] <208079219+amazon-q-developer[bot]@users.noreply.github.com>
---
 .../ai/sample/feature/multimodal/PhotoReasoningViewModel.kt     | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
index e4d62fd..a0ca20f 100644
--- a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
+++ b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
@@ -1229,6 +1229,8 @@ private fun reasonWithMistral(
                     lastMistralTokenKey = key
                     lastMistralTokenTimeMs = System.currentTimeMillis()
                     markKeyCooldown(key, lastMistralTokenTimeMs)
+                } ?: run {
+                    Log.w(TAG, "selectedKeyForResponse is null during streaming callback")
                 }
                 withContext(Dispatchers.Main) {
                     replaceAiMessageText(accText, isPending = true)

From e89c4504a29f4877e8a734fec3430732d954e37d Mon Sep 17 00:00:00 2001
From: Android PowerUser <88908510+Android-PowerUser@users.noreply.github.com>
Date: Mon, 30 Mar 2026 18:25:18 +0200
Subject: [PATCH 3/4] Update
 app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt

Co-authored-by: amazon-q-developer[bot] <208079219+amazon-q-developer[bot]@users.noreply.github.com>
---
 .../ai/sample/feature/multimodal/PhotoReasoningViewModel.kt    | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
index a0ca20f..f930966 100644
--- a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
+++ b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
@@ -1130,6 +1130,9 @@ private fun reasonWithMistral(
                 throw IOException("Mistral API key not found.")
             }
 
+            // Validate that we have at least one key before proceeding
+            require(availableKeys.isNotEmpty()) { "No valid Mistral API keys available after filtering" }
+
             fun markKeyCooldown(key: String, referenceTimeMs: Long) {
                 val nextAllowedAt = referenceTimeMs + MISTRAL_MIN_INTERVAL_MS
                 val existing = mistralNextAllowedRequestAtMsByKey[key] ?: 0L

From d139fcc4676cab32dc5b52ef8b1bb5be37363393 Mon Sep 17 00:00:00 2001
From: "amazon-q-developer[bot]"
 <208079219+amazon-q-developer[bot]@users.noreply.github.com>
Date: Mon, 30 Mar 2026 16:28:34 +0000
Subject: [PATCH 4/4] [skip ci] Fix Mistral API retry logic and error handling

- Add null safety check for selectedKeyForResponse in streaming callback
- Distinguish between network failures and HTTP errors in IOException handling
- Improve retry loop to cycle through all available keys before hitting failure limit
- Update retry attempt messages to reflect dynamic max attempts calculation
---
 .../feature/multimodal/PhotoReasoningViewModel.kt   | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
index f930966..002cb2a 100644
--- a/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
+++ b/app/src/main/kotlin/com/google/ai/sample/feature/multimodal/PhotoReasoningViewModel.kt
@@ -1153,7 +1153,8 @@ private fun reasonWithMistral(
             var consecutiveFailures = 0
             var blockedKeysThisRound = mutableSetOf<String>()
 
-            while (response == null && consecutiveFailures < 5) {
+            val maxAttempts = availableKeys.size * 2 + 3 // Allow cycling through all keys at least twice
+            while (response == null && consecutiveFailures < maxAttempts) {
                 if (stopExecutionFlag.get()) break
 
                 val now = System.currentTimeMillis()
@@ -1193,7 +1194,7 @@ private fun reasonWithMistral(
                     consecutiveFailures++
                     withContext(Dispatchers.Main) {
                         replaceAiMessageText(
-                            "Mistral temporär nicht verfügbar (Versuch $consecutiveFailures/5). Wiederhole...",
+                            "Mistral temporär nicht verfügbar (Versuch $consecutiveFailures/$maxAttempts). Wiederhole...",
                             isPending = true
                         )
                     }
@@ -1207,12 +1208,12 @@ private fun reasonWithMistral(
                     }
                     withContext(Dispatchers.Main) {
                         replaceAiMessageText(
-                            "Mistral Netzwerkfehler (Versuch $consecutiveFailures/5). Wiederhole...",
-                            isPending = true
+                        if (consecutiveFailures >= maxAttempts) {
+                            throw IOException("Mistral request failed after $maxAttempts attempts: ${e.message}", e)
                         )
                     }
                 }
-            }
+                                "Mistral Netzwerkfehler (Versuch $consecutiveFailures/$maxAttempts). Wiederhole...",
 
             if (stopExecutionFlag.get()) {
                 throw IOException("Mistral request aborted.")
@@ -1223,7 +1224,7 @@ private fun reasonWithMistral(
             if (!finalResponse.isSuccessful) {
                 val errBody = finalResponse.body?.string()
                 finalResponse.close()
-                throw IOException("Mistral Error ${finalResponse.code}: $errBody")
+            val finalResponse = response ?: throw IOException("Mistral request failed after $maxAttempts attempts.")
             }
 
             val body = finalResponse.body ?: throw IOException("Empty response body from Mistral")