/** * Shared combo (model combo) handling with fallback support */ import { checkFallbackError, formatRetryAfter } from "./accountFallback.js"; import { unavailableResponse } from "../utils/error.js"; /** * Track rotation state per combo (for round-robin strategy) * @type {Map} */ const comboRotationState = new Map(); /** * Get rotated model list based on strategy * @param {string[]} models - Array of model strings * @param {string} comboName - Name of the combo * @param {string} strategy - "fallback" or "round-robin" * @returns {string[]} Rotated models array */ export function getRotatedModels(models, comboName, strategy) { if (!models || models.length <= 1 || strategy !== "round-robin") { return models; } const currentIndex = comboRotationState.get(comboName) || 0; const rotatedModels = [...models]; // Rotate: move models from currentIndex to front, preserving order after for (let i = 0; i < currentIndex; i++) { const moved = rotatedModels.shift(); rotatedModels.push(moved); } // Update state for next request (cycle through all models) const nextIndex = (currentIndex + 1) % models.length; comboRotationState.set(comboName, nextIndex); return rotatedModels; } /** * Reset in-memory rotation state when combo/settings change * @param {string} [comboName] - Combo name to reset; omit to clear all */ export function resetComboRotation(comboName) { if (comboName) comboRotationState.delete(comboName); else comboRotationState.clear(); } /** * Get combo models from combos data * @param {string} modelStr - Model string to check * @param {Array|Object} combosData - Array of combos or object with combos * @returns {string[]|null} Array of models or null if not a combo */ export function getComboModelsFromData(modelStr, combosData) { // Don't check if it's in provider/model format if (modelStr.includes("/")) return null; // Handle both array and object formats const combos = Array.isArray(combosData) ? combosData : (combosData?.combos || []); const combo = combos.find(c => c.name === modelStr); if (combo && combo.models && combo.models.length > 0) { return combo.models; } return null; } /** * Handle combo chat with fallback * @param {Object} options * @param {Object} options.body - Request body * @param {string[]} options.models - Array of model strings to try * @param {Function} options.handleSingleModel - Function to handle single model: (body, modelStr) => Promise * @param {Object} options.log - Logger object * @param {string} [options.comboName] - Name of the combo (for round-robin tracking) * @param {string} [options.comboStrategy] - Strategy: "fallback" or "round-robin" * @returns {Promise} */ export async function handleComboChat({ body, models, handleSingleModel, log, comboName, comboStrategy }) { // Apply rotation strategy if enabled const rotatedModels = getRotatedModels(models, comboName, comboStrategy); let lastError = null; let earliestRetryAfter = null; let lastStatus = null; for (let i = 0; i < rotatedModels.length; i++) { const modelStr = rotatedModels[i]; log.info("COMBO", `Trying model ${i + 1}/${rotatedModels.length}: ${modelStr}`); try { const result = await handleSingleModel(body, modelStr); // Success (2xx) - return response if (result.ok) { log.info("COMBO", `Model ${modelStr} succeeded`); return result; } // Extract error info from response let errorText = result.statusText || ""; let retryAfter = null; try { const errorBody = await result.clone().json(); errorText = errorBody?.error?.message || errorBody?.error || errorBody?.message || errorText; retryAfter = errorBody?.retryAfter || null; } catch { // Ignore JSON parse errors } // Track earliest retryAfter across all combo models if (retryAfter && (!earliestRetryAfter || new Date(retryAfter) < new Date(earliestRetryAfter))) { earliestRetryAfter = retryAfter; } // Normalize error text to string (Worker-safe) if (typeof errorText !== "string") { try { errorText = JSON.stringify(errorText); } catch { errorText = String(errorText); } } // Check if should fallback to next model const { shouldFallback, cooldownMs } = checkFallbackError(result.status, errorText); if (!shouldFallback) { log.warn("COMBO", `Model ${modelStr} failed (no fallback)`, { status: result.status }); return result; } // For transient errors (503/502/504), wait for cooldown before falling through // so a briefly-overloaded provider gets a chance to recover rather than being // skipped immediately (fixes: combo falls through on transient 503) if (cooldownMs && cooldownMs > 0 && cooldownMs <= 5000 && (result.status === 503 || result.status === 502 || result.status === 504)) { log.info("COMBO", `Model ${modelStr} transient ${result.status}, waiting ${cooldownMs}ms before next`); await new Promise(r => setTimeout(r, cooldownMs)); } // Fallback to next model lastError = errorText || String(result.status); if (!lastStatus) lastStatus = result.status; log.warn("COMBO", `Model ${modelStr} failed, trying next`, { status: result.status }); } catch (error) { // Catch unexpected exceptions to ensure fallback continues lastError = error.message || String(error); if (!lastStatus) lastStatus = 500; log.warn("COMBO", `Model ${modelStr} threw error, trying next`, { error: lastError }); } } // All models failed // Use 503 (Service Unavailable) rather than 406 (Not Acceptable) — 406 implies // the request itself is invalid, but here the providers are simply unavailable // or have no active credentials. 503 is more accurate and retryable by clients. const allDisabled = lastError && lastError.toLowerCase().includes("no credentials"); const status = allDisabled ? 503 : (lastStatus || 503); const msg = lastError || "All combo models unavailable"; if (earliestRetryAfter) { const retryHuman = formatRetryAfter(earliestRetryAfter); log.warn("COMBO", `All models failed | ${msg} (${retryHuman})`); return unavailableResponse(status, msg, earliestRetryAfter, retryHuman); } log.warn("COMBO", `All models failed | ${msg}`); return new Response( JSON.stringify({ error: { message: msg } }), { status, headers: { "Content-Type": "application/json" } } ); }