diff --git a/bun.lock b/bun.lock
index 4a416c88d2..8591e18756 100644
--- a/bun.lock
+++ b/bun.lock
@@ -28,13 +28,13 @@
         "typescript": "^5.7.3",
       },
       "optionalDependencies": {
-        "oh-my-opencode-darwin-arm64": "3.3.1",
-        "oh-my-opencode-darwin-x64": "3.3.1",
-        "oh-my-opencode-linux-arm64": "3.3.1",
-        "oh-my-opencode-linux-arm64-musl": "3.3.1",
-        "oh-my-opencode-linux-x64": "3.3.1",
-        "oh-my-opencode-linux-x64-musl": "3.3.1",
-        "oh-my-opencode-windows-x64": "3.3.1",
+        "oh-my-opencode-darwin-arm64": "3.4.0",
+        "oh-my-opencode-darwin-x64": "3.4.0",
+        "oh-my-opencode-linux-arm64": "3.4.0",
+        "oh-my-opencode-linux-arm64-musl": "3.4.0",
+        "oh-my-opencode-linux-x64": "3.4.0",
+        "oh-my-opencode-linux-x64-musl": "3.4.0",
+        "oh-my-opencode-windows-x64": "3.4.0",
       },
     },
   },
@@ -226,19 +226,19 @@
 
     "object-inspect": ["object-inspect@1.13.4", "", {}, "sha512-W67iLl4J2EXEGTbfeHCffrjDfitvLANg0UlX3wFUUSTx92KXRFegMHUVgSqE+wvhAbi4WqjGg9czysTV2Epbew=="],
 
-    "oh-my-opencode-darwin-arm64": ["oh-my-opencode-darwin-arm64@3.3.1", "", { "os": "darwin", "cpu": "arm64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-R+o42Km6bsIaW6D3I8uu2HCF3BjIWqa/fg38W5y4hJEOw4mL0Q7uV4R+0vtrXRHo9crXTK9ag0fqVQUm+Y6iAQ=="],
+    "oh-my-opencode-darwin-arm64": ["oh-my-opencode-darwin-arm64@3.4.0", "", { "os": "darwin", "cpu": "arm64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-W0941HVUULa/1i4k6eE25PjfqfnnWKL8LKWfSzFNqbc7emmYWfxOnghw6nHdJVAzdVxwX3HSmZaHAFLCtJ4k0A=="],
 
-    "oh-my-opencode-darwin-x64": ["oh-my-opencode-darwin-x64@3.3.1", "", { "os": "darwin", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-7VTbpR1vH3OEkoJxBKtYuxFPX8M3IbJKoeHWME9iK6FpT11W1ASsjyuhvzB1jcxSeqF8ddMnjitlG5ub6h5EVw=="],
+    "oh-my-opencode-darwin-x64": ["oh-my-opencode-darwin-x64@3.4.0", "", { "os": "darwin", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-enwn1v1KjIaxGyTUNLrvRiTDItlIBme6LnKMbt8Fva5gX3CbfCJccmzjOEmKsFnv7y6TpkOll435revRwDCAUw=="],
 
-    "oh-my-opencode-linux-arm64": ["oh-my-opencode-linux-arm64@3.3.1", "", { "os": "linux", "cpu": "arm64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-BZ/r/CFlvbOxkdZZrRoT16xFOjibRZHuwQnaE4f0JvOzgK6/HWp3zJI1+2/aX/oK5GA6lZxNWRrJC/SKUi8LEg=="],
+    "oh-my-opencode-linux-arm64": ["oh-my-opencode-linux-arm64@3.4.0", "", { "os": "linux", "cpu": "arm64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-HybwgSRDBWuczdUMi/8NvRH7vMilG8Y0LKsL6xJmvRtdyleI2KAllQZLcQDK7+TfF1UKgQ+Z8c5lwLoFMTExRQ=="],
 
-    "oh-my-opencode-linux-arm64-musl": ["oh-my-opencode-linux-arm64-musl@3.3.1", "", { "os": "linux", "cpu": "arm64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-U90Wruf21h+CJbtcrS7MeTAc/5VOF6RI+5jr7qj/cCxjXNJtjhyJdz/maehArjtgf304+lYCM/Mh1i+G2D3YFQ=="],
+    "oh-my-opencode-linux-arm64-musl": ["oh-my-opencode-linux-arm64-musl@3.4.0", "", { "os": "linux", "cpu": "arm64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-SNhNSaa1+oS0u6yylqK17RCNgtXX7pRiKHaAd2CI2sQv6UF62Jjipabd6vt3QbpGhoXuVbk/L0schO5kSoEv5A=="],
 
-    "oh-my-opencode-linux-x64": ["oh-my-opencode-linux-x64@3.3.1", "", { "os": "linux", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-sYzohSNdwsAhivbXcbhPdF1qqQi2CCI7FSgbmvvfBOMyZ8HAgqOFqYW2r3GPdmtywzkjOTvCzTG56FZwEjx15w=="],
+    "oh-my-opencode-linux-x64": ["oh-my-opencode-linux-x64@3.4.0", "", { "os": "linux", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-OTRSxRl9Q4AiNtblZeR01zpgsEuApHEchtUIICQGCNb0BvvqdkR7yrj5GQcAdQRIqpSnzaM6Bl6QEb1uhznjPw=="],
 
-    "oh-my-opencode-linux-x64-musl": ["oh-my-opencode-linux-x64-musl@3.3.1", "", { "os": "linux", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-aG5pZ4eWS0YSGUicOnjMkUPrIqQV4poYF+d9SIvrfvlaMcK6WlQn7jXzgNCwJsfGn5lyhSmjshZBEU+v79Ua3w=="],
+    "oh-my-opencode-linux-x64-musl": ["oh-my-opencode-linux-x64-musl@3.4.0", "", { "os": "linux", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode" } }, "sha512-c9EuGMNrsWUeB+h1BX1DfPIs5O+EVZq3YuadIfFgZAK+q/K/VLavEauhH7U748PxJsbFDS5L9SRP6u4Ui4t7lQ=="],
 
-    "oh-my-opencode-windows-x64": ["oh-my-opencode-windows-x64@3.3.1", "", { "os": "win32", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode.exe" } }, "sha512-FGH7cnzBqNwjSkzCDglMsVttaq+MsykAxa7ehaFK+0dnBZArvllS3W13a3dGaANHMZzfK0vz8hNDUdVi7Z63cA=="],
+    "oh-my-opencode-windows-x64": ["oh-my-opencode-windows-x64@3.4.0", "", { "os": "win32", "cpu": "x64", "bin": { "oh-my-opencode": "bin/oh-my-opencode.exe" } }, "sha512-yIl0COMWg3pjYmvTShurmliMUiTCi8VuGgKPcK7gZqpMsNH0UtCQiY9CGf9vJJeHhhzxH2HzCWI1yzTx1V+laA=="],
 
     "on-finished": ["on-finished@2.4.1", "", { "dependencies": { "ee-first": "1.1.1" } }, "sha512-oVlzkg3ENAhCk2zdv7IJwd/QUD4z2RxRwpkcGY8psCVcCYZNq4wYnVWALHM+brtuJjePWiYF/ClmuDr8Ch5+kg=="],
 
diff --git a/docs/configurations.md b/docs/configurations.md
index 2fb67bd475..a20d4a5e38 100644
--- a/docs/configurations.md
+++ b/docs/configurations.md
@@ -163,19 +163,20 @@ Override built-in agent settings:
 }
 ```
 
-Each agent supports: `model`, `temperature`, `top_p`, `prompt`, `prompt_append`, `tools`, `disable`, `description`, `mode`, `color`, `permission`, `category`, `variant`, `maxTokens`, `thinking`, `reasoningEffort`, `textVerbosity`, `providerOptions`.
+Each agent supports: `model`, `fallback_models`, `temperature`, `top_p`, `prompt`, `prompt_append`, `tools`, `disable`, `description`, `mode`, `color`, `permission`, `category`, `variant`, `maxTokens`, `thinking`, `reasoningEffort`, `textVerbosity`, `providerOptions`.
 
 ### Additional Agent Options
 
-| Option              | Type    | Description                                                                                     |
-| ------------------- | ------- | ----------------------------------------------------------------------------------------------- |
-| `category`          | string  | Category name to inherit model and other settings from category defaults                             |
-| `variant`           | string  | Model variant (e.g., `max`, `high`, `medium`, `low`, `xhigh`)                                 |
-| `maxTokens`         | number  | Maximum tokens for response. Passed directly to OpenCode SDK.                                      |
-| `thinking`          | object  | Extended thinking configuration for Anthropic models. See [Thinking Options](#thinking-options) below. |
-| `reasoningEffort`   | string  | OpenAI reasoning effort level. Values: `low`, `medium`, `high`, `xhigh`.                         |
-| `textVerbosity`      | string  | Text verbosity level. Values: `low`, `medium`, `high`.                                        |
-| `providerOptions`    | object  | Provider-specific options passed directly to OpenCode SDK.                                      |
+| Option              | Type           | Description                                                                                     |
+| ------------------- | -------------- | ----------------------------------------------------------------------------------------------- |
+| `fallback_models`   | string/array   | Fallback models for runtime switching on API errors. Single string or array of model strings.  |
+| `category`          | string         | Category name to inherit model and other settings from category defaults                        |
+| `variant`           | string         | Model variant (e.g., `max`, `high`, `medium`, `low`, `xhigh`)                                   |
+| `maxTokens`         | number         | Maximum tokens for response. Passed directly to OpenCode SDK.                                   |
+| `thinking`          | object         | Extended thinking configuration for Anthropic models. See [Thinking Options](#thinking-options) below. |
+| `reasoningEffort`   | string         | OpenAI reasoning effort level. Values: `low`, `medium`, `high`, `xhigh`.                        |
+| `textVerbosity`     | string         | Text verbosity level. Values: `low`, `medium`, `high`.                                          |
+| `providerOptions`   | object         | Provider-specific options passed directly to OpenCode SDK.                                      |
 
 #### Thinking Options (Anthropic)
 
@@ -714,6 +715,63 @@ Configure concurrency limits for background agent tasks. This controls how many
 - Allow more concurrent tasks for fast/cheap models (e.g., Gemini Flash)
 - Respect provider rate limits by setting provider-level caps
 
+## Runtime Fallback
+
+Automatically switch to backup models when the primary model encounters transient API errors (rate limits, overload, etc.). This keeps conversations running without manual intervention.
+
+```json
+{
+  "runtime_fallback": {
+    "enabled": true,
+    "retry_on_errors": [429, 503, 529],
+    "max_fallback_attempts": 3,
+    "cooldown_seconds": 60,
+    "notify_on_fallback": true
+  }
+}
+```
+
+| Option                  | Default           | Description                                                                 |
+| ----------------------- | ----------------- | --------------------------------------------------------------------------- |
+| `enabled`               | `true`            | Enable runtime fallback                                                     |
+| `retry_on_errors`       | `[429, 503, 529]` | HTTP status codes that trigger fallback (rate limit, service unavailable)   |
+| `max_fallback_attempts` | `3`               | Maximum fallback attempts per session (1-10)                                |
+| `cooldown_seconds`      | `60`              | Cooldown in seconds before retrying a failed model                          |
+| `notify_on_fallback`    | `true`            | Show toast notification when switching to a fallback model                  |
+
+### How It Works
+
+1. When an API error matching `retry_on_errors` occurs, the hook intercepts it
+2. The next request automatically uses the next available model from `fallback_models`
+3. Failed models enter a cooldown period before being retried
+4. Toast notification (optional) informs you of the model switch
+
+### Configuring Fallback Models
+
+Define `fallback_models` at the agent or category level:
+
+```json
+{
+  "agents": {
+    "sisyphus": {
+      "model": "anthropic/claude-opus-4-5",
+      "fallback_models": ["openai/gpt-5.2", "google/gemini-3-pro"]
+    }
+  },
+  "categories": {
+    "ultrabrain": {
+      "model": "openai/gpt-5.2-codex",
+      "fallback_models": ["anthropic/claude-opus-4-5", "google/gemini-3-pro"]
+    }
+  }
+}
+```
+
+When the primary model fails:
+1. First fallback: `openai/gpt-5.2`
+2. Second fallback: `google/gemini-3-pro`
+3. After `max_fallback_attempts`, returns to primary model
+
 ## Categories
 
 Categories enable domain-specific task delegation via the `task` tool. Each category applies runtime presets (model, temperature, prompt additions) when calling the `Sisyphus-Junior` agent.
@@ -825,14 +883,72 @@ Add your own categories or override built-in ones:
 }
 ```
 
-Each category supports: `model`, `temperature`, `top_p`, `maxTokens`, `thinking`, `reasoningEffort`, `textVerbosity`, `tools`, `prompt_append`, `variant`, `description`, `is_unstable_agent`.
+Each category supports: `model`, `fallback_models`, `temperature`, `top_p`, `maxTokens`, `thinking`, `reasoningEffort`, `textVerbosity`, `tools`, `prompt_append`, `variant`, `description`, `is_unstable_agent`.
 
 ### Additional Category Options
 
-| Option             | Type    | Default | Description                                                                                         |
-| ------------------ | ------- | ------- | --------------------------------------------------------------------------------------------------- |
-| `description`       | string  | -       | Human-readable description of the category's purpose. Shown in task prompt.                     |
-| `is_unstable_agent`| boolean | `false`  | Mark agent as unstable - forces background mode for monitoring. Auto-enabled for gemini models. |
+| Option              | Type         | Default | Description                                                                                         |
+| ------------------- | ------------ | ------- | --------------------------------------------------------------------------------------------------- |
+| `fallback_models`   | string/array | -       | Fallback models for runtime switching on API errors. Single string or array of model strings.      |
+| `description`       | string       | -       | Human-readable description of the category's purpose. Shown in task prompt.                         |
+| `is_unstable_agent` | boolean      | `false` | Mark agent as unstable - forces background mode for monitoring. Auto-enabled for gemini models.    |
+
+## Runtime Fallback
+
+Automatically switch to backup models when the primary model encounters transient API errors (rate limits, overload, etc.). This keeps conversations running without manual intervention.
+
+```json
+{
+  "runtime_fallback": {
+    "enabled": true,
+    "retry_on_errors": [429, 503, 529],
+    "max_fallback_attempts": 3,
+    "cooldown_seconds": 60,
+    "notify_on_fallback": true
+  }
+}
+```
+
+| Option                  | Default           | Description                                                                 |
+| ----------------------- | ----------------- | --------------------------------------------------------------------------- |
+| `enabled`               | `true`            | Enable runtime fallback                                                     |
+| `retry_on_errors`       | `[429, 503, 529]` | HTTP status codes that trigger fallback (rate limit, service unavailable)   |
+| `max_fallback_attempts` | `3`               | Maximum fallback attempts per session (1-10)                                |
+| `cooldown_seconds`      | `60`              | Cooldown in seconds before retrying a failed model                          |
+| `notify_on_fallback`    | `true`            | Show toast notification when switching to a fallback model                  |
+
+### How It Works
+
+1. When an API error matching `retry_on_errors` occurs, the hook intercepts it
+2. The next request automatically uses the next available model from `fallback_models`
+3. Failed models enter a cooldown period before being retried
+4. Toast notification (optional) informs you of the model switch
+
+### Configuring Fallback Models
+
+Define `fallback_models` at the agent or category level:
+
+```json
+{
+  "agents": {
+    "sisyphus": {
+      "model": "anthropic/claude-opus-4-5",
+      "fallback_models": ["openai/gpt-5.2", "google/gemini-3-pro"]
+    }
+  },
+  "categories": {
+    "ultrabrain": {
+      "model": "openai/gpt-5.2-codex",
+      "fallback_models": ["anthropic/claude-opus-4-5", "google/gemini-3-pro"]
+    }
+  }
+}
+```
+
+When the primary model fails:
+1. First fallback: `openai/gpt-5.2`
+2. Second fallback: `google/gemini-3-pro`
+3. After `max_fallback_attempts`, returns to primary model
 
 ## Model Resolution System
 
@@ -967,7 +1083,7 @@ Disable specific built-in hooks via `disabled_hooks` in `~/.config/opencode/oh-m
 }
 ```
 
-Available hooks: `todo-continuation-enforcer`, `context-window-monitor`, `session-recovery`, `session-notification`, `comment-checker`, `grep-output-truncator`, `tool-output-truncator`, `directory-agents-injector`, `directory-readme-injector`, `empty-task-response-detector`, `think-mode`, `anthropic-context-window-limit-recovery`, `rules-injector`, `background-notification`, `auto-update-checker`, `startup-toast`, `keyword-detector`, `agent-usage-reminder`, `non-interactive-env`, `interactive-bash-session`, `compaction-context-injector`, `thinking-block-validator`, `claude-code-hooks`, `ralph-loop`, `preemptive-compaction`, `auto-slash-command`, `sisyphus-junior-notepad`, `start-work`
+Available hooks: `todo-continuation-enforcer`, `context-window-monitor`, `session-recovery`, `session-notification`, `comment-checker`, `grep-output-truncator`, `tool-output-truncator`, `directory-agents-injector`, `directory-readme-injector`, `empty-task-response-detector`, `think-mode`, `anthropic-context-window-limit-recovery`, `rules-injector`, `background-notification`, `auto-update-checker`, `startup-toast`, `keyword-detector`, `agent-usage-reminder`, `non-interactive-env`, `interactive-bash-session`, `compaction-context-injector`, `thinking-block-validator`, `claude-code-hooks`, `ralph-loop`, `preemptive-compaction`, `auto-slash-command`, `sisyphus-junior-notepad`, `start-work`, `runtime-fallback`
 
 **Note on `directory-agents-injector`**: This hook is **automatically disabled** when running on OpenCode 1.1.37+ because OpenCode now has native support for dynamically resolving AGENTS.md files from subdirectories (PR #10678). This prevents duplicate AGENTS.md injection. For older OpenCode versions, the hook remains active to provide the same functionality.
 
diff --git a/docs/features.md b/docs/features.md
index f73f7a656d..c88c6f4407 100644
--- a/docs/features.md
+++ b/docs/features.md
@@ -352,6 +352,7 @@ Hooks intercept and modify behavior at key points in the agent lifecycle.
 | **session-recovery** | Stop | Recovers from session errors - missing tool results, thinking block issues, empty messages. |
 | **anthropic-context-window-limit-recovery** | Stop | Handles Claude context window limits gracefully. |
 | **background-compaction** | Stop | Auto-compacts sessions hitting token limits. |
+| **runtime-fallback** | Event | Automatically switches to backup models on API errors (429, 503, 529). Configurable retry logic with per-model cooldown. |
 
 #### Truncation & Context Management
 
diff --git a/src/agents/types.ts b/src/agents/types.ts
index 14da69a183..309b71cd92 100644
--- a/src/agents/types.ts
+++ b/src/agents/types.ts
@@ -90,6 +90,7 @@ export type AgentName = BuiltinAgentName
 export type AgentOverrideConfig = Partial<AgentConfig> & {
   prompt_append?: string
   variant?: string
+  fallback_models?: string | string[]
 }
 
 export type AgentOverrides = Partial<Record<OverridableAgentName, AgentOverrideConfig>>
diff --git a/src/agents/utils.test.ts b/src/agents/utils.test.ts
index 6dc8436898..b49cbd413c 100644
--- a/src/agents/utils.test.ts
+++ b/src/agents/utils.test.ts
@@ -51,7 +51,7 @@ describe("createBuiltinAgents with model overrides", () => {
     expect(agents.sisyphus.thinking).toBeUndefined()
   })
 
-  test("Atlas uses uiSelectedModel when provided", async () => {
+  test("Atlas does not use uiSelectedModel (respects its own fallback chain)", async () => {
     // #given
     const fetchSpy = spyOn(shared, "fetchAvailableModels").mockResolvedValue(
       new Set(["openai/gpt-5.2", "anthropic/claude-sonnet-4-5"])
@@ -75,7 +75,7 @@ describe("createBuiltinAgents with model overrides", () => {
 
       // #then
       expect(agents.atlas).toBeDefined()
-      expect(agents.atlas.model).toBe("openai/gpt-5.2")
+      expect(agents.atlas.model).toBe("anthropic/claude-sonnet-4-5")
     } finally {
       fetchSpy.mockRestore()
     }
diff --git a/src/config/index.ts b/src/config/index.ts
index 5f881831ba..f18b87c333 100644
--- a/src/config/index.ts
+++ b/src/config/index.ts
@@ -29,4 +29,6 @@ export type {
   TmuxLayout,
   SisyphusConfig,
   SisyphusTasksConfig,
+  RuntimeFallbackConfig,
+  FallbackModels,
 } from "./schema"
diff --git a/src/config/schema.ts b/src/config/schema.ts
index e4c55c6ff3..02326bff13 100644
--- a/src/config/schema.ts
+++ b/src/config/schema.ts
@@ -14,6 +14,7 @@ export * from "./schema/hooks"
 export * from "./schema/notification"
 export * from "./schema/oh-my-opencode-config"
 export * from "./schema/ralph-loop"
+export * from "./schema/runtime-fallback"
 export * from "./schema/skills"
 export * from "./schema/sisyphus"
 export * from "./schema/sisyphus-agent"
diff --git a/src/config/schema/agent-overrides.ts b/src/config/schema/agent-overrides.ts
index 8fd48e330c..f642e36544 100644
--- a/src/config/schema/agent-overrides.ts
+++ b/src/config/schema/agent-overrides.ts
@@ -1,5 +1,6 @@
 import { z } from "zod"
 import { AgentPermissionSchema } from "./internal/permission"
+import { FallbackModelsSchema } from "./runtime-fallback"
 
 export const AgentOverrideConfigSchema = z.object({
   /** @deprecated Use `category` instead. Model is inherited from category defaults. */
@@ -37,6 +38,8 @@ export const AgentOverrideConfigSchema = z.object({
   textVerbosity: z.enum(["low", "medium", "high"]).optional(),
   /** Provider-specific options. Passed directly to OpenCode SDK. */
   providerOptions: z.record(z.string(), z.unknown()).optional(),
+  /** Fallback models for runtime switching on API errors. Single string or array of model strings. */
+  fallback_models: FallbackModelsSchema.optional(),
 })
 
 export const AgentOverridesSchema = z.object({
diff --git a/src/config/schema/categories.ts b/src/config/schema/categories.ts
index b8028c5721..d0a38997d8 100644
--- a/src/config/schema/categories.ts
+++ b/src/config/schema/categories.ts
@@ -1,4 +1,5 @@
 import { z } from "zod"
+import { FallbackModelsSchema } from "./runtime-fallback"
 
 export const CategoryConfigSchema = z.object({
   /** Human-readable description of the category's purpose. Shown in task prompt. */
@@ -20,6 +21,8 @@ export const CategoryConfigSchema = z.object({
   prompt_append: z.string().optional(),
   /** Mark agent as unstable - forces background mode for monitoring. Auto-enabled for gemini/minimax models. */
   is_unstable_agent: z.boolean().optional(),
+  /** Fallback models for runtime switching on API errors. Single string or array of model strings. */
+  fallback_models: FallbackModelsSchema.optional(),
 })
 
 export const BuiltinCategoryNameSchema = z.enum([
diff --git a/src/config/schema/hooks.ts b/src/config/schema/hooks.ts
index bb5f6bdb0b..53a360588d 100644
--- a/src/config/schema/hooks.ts
+++ b/src/config/schema/hooks.ts
@@ -46,6 +46,7 @@ export const HookNameSchema = z.enum([
   "tasks-todowrite-disabler",
   "write-existing-file-guard",
   "anthropic-effort",
+  "runtime-fallback",
 ])
 
 export type HookName = z.infer<typeof HookNameSchema>
diff --git a/src/config/schema/oh-my-opencode-config.ts b/src/config/schema/oh-my-opencode-config.ts
index be0ebd9149..f1eeff96ce 100644
--- a/src/config/schema/oh-my-opencode-config.ts
+++ b/src/config/schema/oh-my-opencode-config.ts
@@ -14,6 +14,7 @@ import { GitMasterConfigSchema } from "./git-master"
 import { HookNameSchema } from "./hooks"
 import { NotificationConfigSchema } from "./notification"
 import { RalphLoopConfigSchema } from "./ralph-loop"
+import { RuntimeFallbackConfigSchema } from "./runtime-fallback"
 import { SkillsConfigSchema } from "./skills"
 import { SisyphusConfigSchema } from "./sisyphus"
 import { SisyphusAgentConfigSchema } from "./sisyphus-agent"
@@ -42,6 +43,7 @@ export const OhMyOpenCodeConfigSchema = z.object({
   auto_update: z.boolean().optional(),
   skills: SkillsConfigSchema.optional(),
   ralph_loop: RalphLoopConfigSchema.optional(),
+  runtime_fallback: RuntimeFallbackConfigSchema.optional(),
   background_task: BackgroundTaskConfigSchema.optional(),
   notification: NotificationConfigSchema.optional(),
   babysitting: BabysittingConfigSchema.optional(),
diff --git a/src/config/schema/runtime-fallback.ts b/src/config/schema/runtime-fallback.ts
new file mode 100644
index 0000000000..b80f9a8ff3
--- /dev/null
+++ b/src/config/schema/runtime-fallback.ts
@@ -0,0 +1,19 @@
+import { z } from "zod"
+
+export const FallbackModelsSchema = z.union([z.string(), z.array(z.string())])
+
+export const RuntimeFallbackConfigSchema = z.object({
+  /** Enable runtime fallback (default: true) */
+  enabled: z.boolean().optional(),
+  /** HTTP status codes that trigger fallback (default: [429, 503, 529]) */
+  retry_on_errors: z.array(z.number()).optional(),
+  /** Maximum fallback attempts per session (default: 3) */
+  max_fallback_attempts: z.number().min(1).max(10).optional(),
+  /** Cooldown in seconds before retrying a failed model (default: 60) */
+  cooldown_seconds: z.number().min(0).optional(),
+  /** Show toast notification when switching to fallback model (default: true) */
+  notify_on_fallback: z.boolean().optional(),
+})
+
+export type RuntimeFallbackConfig = z.infer<typeof RuntimeFallbackConfigSchema>
+export type FallbackModels = z.infer<typeof FallbackModelsSchema>
diff --git a/src/features/background-agent/manager.ts b/src/features/background-agent/manager.ts
index 7872bebbe6..3ede32fabc 100644
--- a/src/features/background-agent/manager.ts
+++ b/src/features/background-agent/manager.ts
@@ -5,7 +5,7 @@ import type {
   LaunchInput,
   ResumeInput,
 } from "./types"
-import { log, getAgentToolRestrictions, promptWithModelSuggestionRetry } from "../../shared"
+import { log, getAgentToolRestrictions, promptWithModelSuggestionRetry, SessionCategoryRegistry } from "../../shared"
 import { ConcurrencyManager } from "./concurrency"
 import type { BackgroundTaskConfig, TmuxConfig } from "../../config/schema"
 import { isInsideTmux } from "../../shared/tmux"
@@ -780,6 +780,7 @@ export class BackgroundManager {
         this.clearNotificationsForTask(task.id)
         if (task.sessionID) {
           subagentSessions.delete(task.sessionID)
+          SessionCategoryRegistry.remove(task.sessionID)
         }
       }
     }
@@ -944,6 +945,8 @@ export class BackgroundManager {
       this.client.session.abort({
         path: { id: task.sessionID },
       }).catch(() => {})
+
+      SessionCategoryRegistry.remove(task.sessionID)
     }
 
     if (options?.skipNotification) {
@@ -1086,6 +1089,8 @@ export class BackgroundManager {
       this.client.session.abort({
         path: { id: task.sessionID },
       }).catch(() => {})
+
+      SessionCategoryRegistry.remove(task.sessionID)
     }
 
     try {
@@ -1327,6 +1332,7 @@ Use \`background_output(task_id="${task.id}")\` to retrieve this result when rea
         this.tasks.delete(taskId)
         if (task.sessionID) {
           subagentSessions.delete(task.sessionID)
+          SessionCategoryRegistry.remove(task.sessionID)
         }
       }
     }
diff --git a/src/hooks/index.ts b/src/hooks/index.ts
index 9544752778..16e9a6cae5 100644
--- a/src/hooks/index.ts
+++ b/src/hooks/index.ts
@@ -44,3 +44,4 @@ export { createUnstableAgentBabysitterHook } from "./unstable-agent-babysitter";
 export { createPreemptiveCompactionHook } from "./preemptive-compaction";
 export { createTasksTodowriteDisablerHook } from "./tasks-todowrite-disabler";
 export { createWriteExistingFileGuardHook } from "./write-existing-file-guard";
+export { createRuntimeFallbackHook, type RuntimeFallbackHook, type RuntimeFallbackOptions } from "./runtime-fallback";
diff --git a/src/hooks/runtime-fallback/constants.ts b/src/hooks/runtime-fallback/constants.ts
new file mode 100644
index 0000000000..f3f25956ca
--- /dev/null
+++ b/src/hooks/runtime-fallback/constants.ts
@@ -0,0 +1,40 @@
+/**
+ * Runtime Fallback Hook - Constants
+ *
+ * Default values and configuration constants for the runtime fallback feature.
+ */
+
+import type { RuntimeFallbackConfig } from "../../config"
+
+/**
+ * Default configuration values for runtime fallback
+ */
+export const DEFAULT_CONFIG: Required<RuntimeFallbackConfig> = {
+  enabled: true,
+  retry_on_errors: [429, 503, 529],
+  max_fallback_attempts: 3,
+  cooldown_seconds: 60,
+  notify_on_fallback: true,
+}
+
+/**
+ * Error patterns that indicate rate limiting or temporary failures
+ * These are checked in addition to HTTP status codes
+ */
+export const RETRYABLE_ERROR_PATTERNS = [
+  /rate.?limit/i,
+  /too.?many.?requests/i,
+  /quota.?exceeded/i,
+  /service.?unavailable/i,
+  /overloaded/i,
+  /temporarily.?unavailable/i,
+  /try.?again/i,
+  /(?:^|\s)429(?:\s|$)/,
+  /(?:^|\s)503(?:\s|$)/,
+  /(?:^|\s)529(?:\s|$)/,
+]
+
+/**
+ * Hook name for identification and logging
+ */
+export const HOOK_NAME = "runtime-fallback"
diff --git a/src/hooks/runtime-fallback/index.test.ts b/src/hooks/runtime-fallback/index.test.ts
new file mode 100644
index 0000000000..bd4a0122e9
--- /dev/null
+++ b/src/hooks/runtime-fallback/index.test.ts
@@ -0,0 +1,662 @@
+import { describe, expect, test, beforeEach, afterEach, spyOn } from "bun:test"
+import { createRuntimeFallbackHook, type RuntimeFallbackHook } from "./index"
+import type { RuntimeFallbackConfig, OhMyOpenCodeConfig } from "../../config"
+import * as sharedModule from "../../shared"
+import { SessionCategoryRegistry } from "../../shared/session-category-registry"
+
+describe("runtime-fallback", () => {
+  let logCalls: Array<{ msg: string; data?: unknown }>
+  let logSpy: ReturnType<typeof spyOn>
+  let toastCalls: Array<{ title: string; message: string; variant: string }>
+
+  beforeEach(() => {
+    logCalls = []
+    toastCalls = []
+    SessionCategoryRegistry.clear()
+    logSpy = spyOn(sharedModule, "log").mockImplementation((msg: string, data?: unknown) => {
+      logCalls.push({ msg, data })
+    })
+  })
+
+  afterEach(() => {
+    SessionCategoryRegistry.clear()
+    logSpy?.mockRestore()
+  })
+
+  function createMockPluginInput() {
+    return {
+      client: {
+        tui: {
+          showToast: async (opts: { body: { title: string; message: string; variant: string; duration: number } }) => {
+            toastCalls.push({
+              title: opts.body.title,
+              message: opts.body.message,
+              variant: opts.body.variant,
+            })
+          },
+        },
+      },
+      directory: "/test/dir",
+    } as any
+  }
+
+  function createMockConfig(overrides?: Partial<RuntimeFallbackConfig>): RuntimeFallbackConfig {
+    return {
+      enabled: true,
+      retry_on_errors: [429, 503, 529],
+      max_fallback_attempts: 3,
+      cooldown_seconds: 60,
+      notify_on_fallback: true,
+      ...overrides,
+    }
+  }
+
+  function createMockPluginConfigWithCategoryFallback(fallbackModels: string[]): OhMyOpenCodeConfig {
+    return {
+      categories: {
+        test: {
+          fallback_models: fallbackModels,
+        },
+      },
+    }
+  }
+
+  describe("session.error handling", () => {
+    test("should detect retryable error with status code 429", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-123"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429, message: "Rate limit exceeded" } },
+        },
+      })
+
+      const fallbackLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(fallbackLog).toBeDefined()
+      expect(fallbackLog?.data).toMatchObject({ sessionID, statusCode: 429 })
+    })
+
+    test("should detect retryable error with status code 503", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-503"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "openai/gpt-5.2" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 503, message: "Service unavailable" } },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+
+    test("should detect retryable error with status code 529", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-529"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "google/gemini-3-pro" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 529, message: "Overloaded" } },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+
+    test("should skip non-retryable errors", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-400"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 400, message: "Bad request" } },
+        },
+      })
+
+      const skipLog = logCalls.find((c) => c.msg.includes("Error not retryable"))
+      expect(skipLog).toBeDefined()
+    })
+
+    test("should detect retryable error from message pattern 'rate limit'", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-pattern"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { message: "You have hit the rate limit" } },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+
+    test("should log when no fallback models configured", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-no-fallbacks"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429, message: "Rate limit" } },
+        },
+      })
+
+      const noFallbackLog = logCalls.find((c) => c.msg.includes("No fallback models configured"))
+      expect(noFallbackLog).toBeDefined()
+    })
+  })
+
+  describe("disabled hook", () => {
+    test("should not process events when disabled", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ enabled: false }),
+      })
+      const sessionID = "test-session-disabled"
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429 } },
+        },
+      })
+
+      const sessionErrorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(sessionErrorLog).toBeUndefined()
+    })
+  })
+
+  describe("session lifecycle", () => {
+    test("should create state on session.created", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-create"
+      const model = "anthropic/claude-opus-4-5"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model } },
+        },
+      })
+
+      const createLog = logCalls.find((c) => c.msg.includes("Session created with model"))
+      expect(createLog).toBeDefined()
+      expect(createLog?.data).toMatchObject({ sessionID, model })
+    })
+
+    test("should cleanup state on session.deleted", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-delete"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.deleted",
+          properties: { info: { id: sessionID } },
+        },
+      })
+
+      const deleteLog = logCalls.find((c) => c.msg.includes("Cleaning up session state"))
+      expect(deleteLog).toBeDefined()
+      expect(deleteLog?.data).toMatchObject({ sessionID })
+    })
+
+    test("should handle session.error without prior session.created", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-session-no-create"
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: {
+            sessionID,
+            error: { statusCode: 429 },
+            model: "anthropic/claude-opus-4-5",
+          },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+  })
+
+  describe("error code extraction", () => {
+    test("should extract status code from error object", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-extract-status"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "test-model" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: {
+            sessionID,
+            error: { statusCode: 429, message: "Rate limit" },
+          },
+        },
+      })
+
+      const statusLog = logCalls.find((c) => c.data && typeof c.data === "object" && "statusCode" in c.data)
+      expect(statusLog?.data).toMatchObject({ statusCode: 429 })
+    })
+
+    test("should extract status code from nested error.data", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-nested-status"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "test-model" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: {
+            sessionID,
+            error: { data: { statusCode: 503, message: "Service unavailable" } },
+          },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+  })
+
+  describe("custom error codes", () => {
+    test("should support custom retry_on_errors configuration", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ retry_on_errors: [500, 502] }),
+      })
+      const sessionID = "test-session-custom"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "test-model" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 500 } },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+  })
+
+  describe("message.updated handling", () => {
+    test("should handle assistant message errors", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-message-updated"
+
+      await hook.event({
+        event: {
+          type: "message.updated",
+          properties: {
+            info: {
+              sessionID,
+              role: "assistant",
+              error: { statusCode: 429, message: "Rate limit" },
+              model: "anthropic/claude-opus-4-5",
+            },
+          },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("message.updated with assistant error"))
+      expect(errorLog).toBeDefined()
+    })
+
+    test("should skip non-assistant message errors", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-message-user"
+
+      await hook.event({
+        event: {
+          type: "message.updated",
+          properties: {
+            info: {
+              sessionID,
+              role: "user",
+              error: { statusCode: 429 },
+              model: "anthropic/claude-opus-4-5",
+            },
+          },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("message.updated with assistant error"))
+      expect(errorLog).toBeUndefined()
+    })
+  })
+
+  describe("edge cases", () => {
+    test("should handle session.error without sessionID", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { error: { statusCode: 429 } },
+        },
+      })
+
+      const skipLog = logCalls.find((c) => c.msg.includes("session.error without sessionID"))
+      expect(skipLog).toBeDefined()
+    })
+
+    test("should handle error as string", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-error-string"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "test-model" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: "rate limit exceeded" },
+        },
+      })
+
+      const errorLog = logCalls.find((c) => c.msg.includes("session.error received"))
+      expect(errorLog).toBeDefined()
+    })
+
+    test("should handle null error", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), { config: createMockConfig() })
+      const sessionID = "test-error-null"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "test-model" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: null },
+        },
+      })
+
+      const skipLog = logCalls.find((c) => c.msg.includes("Error not retryable"))
+      expect(skipLog).toBeDefined()
+    })
+  })
+
+  describe("model switching via chat.message", () => {
+    test("should apply fallback model on next chat.message after error", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ notify_on_fallback: false }),
+        pluginConfig: createMockPluginConfigWithCategoryFallback(["openai/gpt-5.2", "google/gemini-3-pro"]),
+      })
+      const sessionID = "test-session-switch"
+      SessionCategoryRegistry.register(sessionID, "test")
+
+      //#given
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      //#when
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429, message: "Rate limit" } },
+        },
+      })
+
+      const output = { message: {}, parts: [] }
+      await hook["chat.message"]?.(
+        { sessionID, model: { providerID: "anthropic", modelID: "claude-opus-4-5" } },
+        output
+      )
+
+      expect(output.message.model).toEqual({ providerID: "openai", modelID: "gpt-5.2" })
+    })
+
+    test("should notify when fallback occurs", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ notify_on_fallback: true }),
+        pluginConfig: createMockPluginConfigWithCategoryFallback(["openai/gpt-5.2"]),
+      })
+      const sessionID = "test-session-notify"
+      SessionCategoryRegistry.register(sessionID, "test")
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429 } },
+        },
+      })
+
+      expect(toastCalls.length).toBe(1)
+      expect(toastCalls[0]?.message.includes("gpt-5.2")).toBe(true)
+    })
+  })
+
+  describe("fallback models configuration", () => {
+    function createMockPluginConfigWithAgentFallback(agentName: string, fallbackModels: string[]): OhMyOpenCodeConfig {
+      return {
+        agents: {
+          [agentName]: {
+            fallback_models: fallbackModels,
+          },
+        },
+      }
+    }
+
+    test("should use agent-level fallback_models", async () => {
+      const input = createMockPluginInput()
+      const hook = createRuntimeFallbackHook(input, {
+        config: createMockConfig({ notify_on_fallback: false }),
+        pluginConfig: createMockPluginConfigWithAgentFallback("oracle", ["openai/gpt-5.2", "google/gemini-3-pro"]),
+      })
+      const sessionID = "test-agent-fallback"
+
+      //#given - agent with custom fallback models
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5", agent: "oracle" } },
+        },
+      })
+
+      //#when - error occurs
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 503 }, agent: "oracle" },
+        },
+      })
+
+      //#then - should prepare fallback to openai/gpt-5.2
+      const fallbackLog = logCalls.find((c) => c.msg.includes("Preparing fallback"))
+      expect(fallbackLog).toBeDefined()
+      expect(fallbackLog?.data).toMatchObject({ from: "anthropic/claude-opus-4-5", to: "openai/gpt-5.2" })
+    })
+
+    test("should detect agent from sessionID pattern", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ notify_on_fallback: false }),
+        pluginConfig: createMockPluginConfigWithAgentFallback("sisyphus", ["openai/gpt-5.2"]),
+      })
+      const sessionID = "sisyphus-session-123"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429 } },
+        },
+      })
+
+      //#then - should detect sisyphus from sessionID and use its fallback
+      const fallbackLog = logCalls.find((c) => c.msg.includes("Preparing fallback"))
+      expect(fallbackLog).toBeDefined()
+      expect(fallbackLog?.data).toMatchObject({ to: "openai/gpt-5.2" })
+    })
+  })
+
+  describe("cooldown mechanism", () => {
+    test("should respect cooldown period before retrying failed model", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ cooldown_seconds: 60, notify_on_fallback: false }),
+        pluginConfig: createMockPluginConfigWithCategoryFallback([
+          "openai/gpt-5.2",
+          "anthropic/claude-opus-4-5",
+        ]),
+      })
+      const sessionID = "test-session-cooldown"
+      SessionCategoryRegistry.register(sessionID, "test")
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      //#when - first error occurs, switches to openai
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429 } },
+        },
+      })
+
+      //#when - second error occurs immediately; tries to switch back to original model but should be in cooldown
+      await hook.event({
+        event: {
+          type: "session.error",
+          properties: { sessionID, error: { statusCode: 429 } },
+        },
+      })
+
+      const cooldownSkipLog = logCalls.find((c) => c.msg.includes("Skipping fallback model in cooldown"))
+      expect(cooldownSkipLog).toBeDefined()
+    })
+  })
+
+  describe("max attempts limit", () => {
+    test("should stop after max_fallback_attempts", async () => {
+      const hook = createRuntimeFallbackHook(createMockPluginInput(), {
+        config: createMockConfig({ max_fallback_attempts: 2 }),
+      })
+      const sessionID = "test-session-max"
+
+      await hook.event({
+        event: {
+          type: "session.created",
+          properties: { info: { id: sessionID, model: "anthropic/claude-opus-4-5" } },
+        },
+      })
+
+      //#when - multiple errors occur exceeding max attempts
+      for (let i = 0; i < 5; i++) {
+        await hook.event({
+          event: {
+            type: "session.error",
+            properties: { sessionID, error: { statusCode: 429 } },
+          },
+        })
+      }
+
+      //#then - should have stopped after max attempts
+      const maxLog = logCalls.find((c) => c.msg.includes("Max fallback attempts reached") || c.msg.includes("No fallback models"))
+      expect(maxLog).toBeDefined()
+    })
+  })
+})
diff --git a/src/hooks/runtime-fallback/index.ts b/src/hooks/runtime-fallback/index.ts
new file mode 100644
index 0000000000..bff23d666c
--- /dev/null
+++ b/src/hooks/runtime-fallback/index.ts
@@ -0,0 +1,435 @@
+import type { PluginInput } from "@opencode-ai/plugin"
+import type { RuntimeFallbackConfig, OhMyOpenCodeConfig } from "../../config"
+import type { FallbackState, FallbackResult, RuntimeFallbackHook, RuntimeFallbackOptions } from "./types"
+import { DEFAULT_CONFIG, RETRYABLE_ERROR_PATTERNS, HOOK_NAME } from "./constants"
+import { log } from "../../shared/logger"
+import { SessionCategoryRegistry } from "../../shared/session-category-registry"
+import { normalizeFallbackModels } from "../../shared/model-resolver"
+
+function createFallbackState(originalModel: string): FallbackState {
+  return {
+    originalModel,
+    currentModel: originalModel,
+    fallbackIndex: -1,
+    failedModels: new Map<string, number>(),
+    attemptCount: 0,
+    pendingFallbackModel: undefined,
+  }
+}
+
+function getErrorMessage(error: unknown): string {
+  if (!error) return ""
+  if (typeof error === "string") return error.toLowerCase()
+
+  const errorObj = error as Record<string, unknown>
+  const paths = [
+    errorObj.data,
+    errorObj.error,
+    errorObj,
+    (errorObj.data as Record<string, unknown>)?.error,
+  ]
+
+  for (const obj of paths) {
+    if (obj && typeof obj === "object") {
+      const msg = (obj as Record<string, unknown>).message
+      if (typeof msg === "string" && msg.length > 0) {
+        return msg.toLowerCase()
+      }
+    }
+  }
+
+  try {
+    return JSON.stringify(error).toLowerCase()
+  } catch {
+    return ""
+  }
+}
+
+function extractStatusCode(error: unknown): number | undefined {
+  if (!error) return undefined
+
+  const errorObj = error as Record<string, unknown>
+
+  const statusCode = errorObj.statusCode ?? errorObj.status ?? (errorObj.data as Record<string, unknown>)?.statusCode
+  if (typeof statusCode === "number") {
+    return statusCode
+  }
+
+  const message = getErrorMessage(error)
+  const statusMatch = message.match(/\b(429|503|529)\b/)
+  if (statusMatch) {
+    return parseInt(statusMatch[1], 10)
+  }
+
+  return undefined
+}
+
+function isRetryableError(error: unknown, retryOnErrors: number[]): boolean {
+  const statusCode = extractStatusCode(error)
+
+  if (statusCode && retryOnErrors.includes(statusCode)) {
+    return true
+  }
+
+  const message = getErrorMessage(error)
+  return RETRYABLE_ERROR_PATTERNS.some((pattern) => pattern.test(message))
+}
+
+function getFallbackModelsForSession(
+  sessionID: string,
+  agent: string | undefined,
+  pluginConfig: OhMyOpenCodeConfig | undefined
+): string[] {
+  if (!pluginConfig) return []
+
+  //#when - session has category from delegate_task, try category fallback_models first
+  const sessionCategory = SessionCategoryRegistry.get(sessionID)
+  if (sessionCategory && pluginConfig.categories?.[sessionCategory]) {
+    const categoryConfig = pluginConfig.categories[sessionCategory]
+    if (categoryConfig?.fallback_models) {
+      return normalizeFallbackModels(categoryConfig.fallback_models) ?? []
+    }
+  }
+
+  const tryGetFallbackFromAgent = (agentName: string): string[] | undefined => {
+    const agentConfig = pluginConfig.agents?.[agentName as keyof typeof pluginConfig.agents]
+    if (!agentConfig) return undefined
+    
+    if (agentConfig?.fallback_models) {
+      return normalizeFallbackModels(agentConfig.fallback_models)
+    }
+    
+    const agentCategory = agentConfig?.category
+    if (agentCategory && pluginConfig.categories?.[agentCategory]) {
+      const categoryConfig = pluginConfig.categories[agentCategory]
+      if (categoryConfig?.fallback_models) {
+        return normalizeFallbackModels(categoryConfig.fallback_models)
+      }
+    }
+    
+    return undefined
+  }
+
+  if (agent) {
+    const result = tryGetFallbackFromAgent(agent)
+    if (result) return result
+  }
+
+  const AGENT_NAMES = [
+    "sisyphus",
+    "oracle",
+    "librarian",
+    "explore",
+    "prometheus",
+    "atlas",
+    "metis",
+    "momus",
+    "hephaestus",
+    "sisyphus-junior",
+    "build",
+    "plan",
+    "multimodal-looker",
+  ]
+  const agentPattern = new RegExp(
+    `\\b(${AGENT_NAMES
+      .sort((a, b) => b.length - a.length)
+      .map((a) => a.replace(/-/g, "\\-"))
+      .join("|")})\\b`,
+    "i",
+  )
+  const sessionAgentMatch = sessionID.match(agentPattern)
+  if (sessionAgentMatch) {
+    const detectedAgent = sessionAgentMatch[1].toLowerCase()
+    const result = tryGetFallbackFromAgent(detectedAgent)
+    if (result) return result
+  }
+
+  return []
+}
+
+function isModelInCooldown(model: string, state: FallbackState, cooldownSeconds: number): boolean {
+  const failedAt = state.failedModels.get(model)
+  if (failedAt === undefined) return false
+  const cooldownMs = cooldownSeconds * 1000
+  return Date.now() - failedAt < cooldownMs
+}
+
+function findNextAvailableFallback(
+  state: FallbackState,
+  fallbackModels: string[],
+  cooldownSeconds: number
+): string | undefined {
+  for (let i = state.fallbackIndex + 1; i < fallbackModels.length; i++) {
+    const candidate = fallbackModels[i]
+    if (!isModelInCooldown(candidate, state, cooldownSeconds)) {
+      return candidate
+    }
+    log(`[${HOOK_NAME}] Skipping fallback model in cooldown`, { model: candidate, index: i })
+  }
+  return undefined
+}
+
+function prepareFallback(
+  sessionID: string,
+  state: FallbackState,
+  fallbackModels: string[],
+  config: Required<RuntimeFallbackConfig>
+): FallbackResult {
+  if (state.attemptCount >= config.max_fallback_attempts) {
+    log(`[${HOOK_NAME}] Max fallback attempts reached`, { sessionID, attempts: state.attemptCount })
+    return { success: false, error: "Max fallback attempts reached", maxAttemptsReached: true }
+  }
+
+  const nextModel = findNextAvailableFallback(state, fallbackModels, config.cooldown_seconds)
+
+  if (!nextModel) {
+    log(`[${HOOK_NAME}] No available fallback models`, { sessionID })
+    return { success: false, error: "No available fallback models (all in cooldown or exhausted)" }
+  }
+
+  log(`[${HOOK_NAME}] Preparing fallback`, {
+    sessionID,
+    from: state.currentModel,
+    to: nextModel,
+    attempt: state.attemptCount + 1,
+  })
+
+  const failedModel = state.currentModel
+  const now = Date.now()
+
+  state.fallbackIndex = fallbackModels.indexOf(nextModel)
+  state.failedModels.set(failedModel, now)
+  state.attemptCount++
+  state.currentModel = nextModel
+  state.pendingFallbackModel = nextModel
+
+  return { success: true, newModel: nextModel }
+}
+
+export type { RuntimeFallbackHook, RuntimeFallbackOptions } from "./types"
+
+export function createRuntimeFallbackHook(
+  ctx: PluginInput,
+  options?: RuntimeFallbackOptions
+): RuntimeFallbackHook {
+  const config: Required<RuntimeFallbackConfig> = {
+    enabled: options?.config?.enabled ?? DEFAULT_CONFIG.enabled,
+    retry_on_errors: options?.config?.retry_on_errors ?? DEFAULT_CONFIG.retry_on_errors,
+    max_fallback_attempts: options?.config?.max_fallback_attempts ?? DEFAULT_CONFIG.max_fallback_attempts,
+    cooldown_seconds: options?.config?.cooldown_seconds ?? DEFAULT_CONFIG.cooldown_seconds,
+    notify_on_fallback: options?.config?.notify_on_fallback ?? DEFAULT_CONFIG.notify_on_fallback,
+  }
+
+  const sessionStates = new Map<string, FallbackState>()
+  const sessionLastAccess = new Map<string, number>()
+  const SESSION_TTL_MS = 30 * 60 * 1000 // 30 minutes TTL for stale sessions
+
+  // Periodic cleanup of stale session states to prevent memory leaks
+  const cleanupStaleSessions = () => {
+    const now = Date.now()
+    let cleanedCount = 0
+    for (const [sessionID, lastAccess] of sessionLastAccess.entries()) {
+      if (now - lastAccess > SESSION_TTL_MS) {
+        sessionStates.delete(sessionID)
+        sessionLastAccess.delete(sessionID)
+        SessionCategoryRegistry.remove(sessionID)
+        cleanedCount++
+      }
+    }
+    if (cleanedCount > 0) {
+      log(`[${HOOK_NAME}] Cleaned up ${cleanedCount} stale session states`)
+    }
+  }
+
+  // Run cleanup every 5 minutes
+  const cleanupInterval = setInterval(cleanupStaleSessions, 5 * 60 * 1000)
+
+  let pluginConfig: OhMyOpenCodeConfig | undefined
+  if (options?.pluginConfig) {
+    pluginConfig = options.pluginConfig
+  } else {
+    try {
+      const { loadPluginConfig } = require("../../plugin-config")
+      pluginConfig = loadPluginConfig(ctx.directory, ctx)
+    } catch {
+      log(`[${HOOK_NAME}] Plugin config not available`)
+    }
+  }
+
+  const eventHandler = async ({ event }: { event: { type: string; properties?: unknown } }) => {
+    if (!config.enabled) return
+
+    const props = event.properties as Record<string, unknown> | undefined
+
+    if (event.type === "session.created") {
+      const sessionInfo = props?.info as { id?: string; model?: string } | undefined
+      const sessionID = sessionInfo?.id
+      const model = sessionInfo?.model
+
+      if (sessionID && model) {
+        log(`[${HOOK_NAME}] Session created with model`, { sessionID, model })
+        sessionStates.set(sessionID, createFallbackState(model))
+        sessionLastAccess.set(sessionID, Date.now())
+      }
+      return
+    }
+
+    if (event.type === "session.deleted") {
+      const sessionInfo = props?.info as { id?: string } | undefined
+      const sessionID = sessionInfo?.id
+
+      if (sessionID) {
+        log(`[${HOOK_NAME}] Cleaning up session state`, { sessionID })
+        sessionStates.delete(sessionID)
+        sessionLastAccess.delete(sessionID)
+        SessionCategoryRegistry.remove(sessionID)
+      }
+      return
+    }
+
+    if (event.type === "session.error") {
+      const sessionID = props?.sessionID as string | undefined
+      const error = props?.error
+      const agent = props?.agent as string | undefined
+
+      if (!sessionID) {
+        log(`[${HOOK_NAME}] session.error without sessionID, skipping`)
+        return
+      }
+
+      log(`[${HOOK_NAME}] session.error received`, { sessionID, agent, statusCode: extractStatusCode(error) })
+
+      if (!isRetryableError(error, config.retry_on_errors)) {
+        log(`[${HOOK_NAME}] Error not retryable, skipping fallback`, { sessionID })
+        return
+      }
+
+      let state = sessionStates.get(sessionID)
+      const fallbackModels = getFallbackModelsForSession(sessionID, agent, pluginConfig)
+
+      if (fallbackModels.length === 0) {
+        log(`[${HOOK_NAME}] No fallback models configured`, { sessionID, agent })
+        return
+      }
+
+      if (!state) {
+        const currentModel = props?.model as string | undefined
+        if (currentModel) {
+          state = createFallbackState(currentModel)
+          sessionStates.set(sessionID, state)
+          sessionLastAccess.set(sessionID, Date.now())
+        } else {
+          log(`[${HOOK_NAME}] No model info available, cannot fallback`, { sessionID })
+          return
+        }
+      } else {
+        sessionLastAccess.set(sessionID, Date.now())
+      }
+
+      const result = prepareFallback(sessionID, state, fallbackModels, config)
+
+      if (result.success && config.notify_on_fallback) {
+        await ctx.client.tui
+          .showToast({
+            body: {
+              title: "Model Fallback",
+              message: `Switching to ${result.newModel?.split("/").pop() || result.newModel} for next request`,
+              variant: "warning",
+              duration: 5000,
+            },
+          })
+          .catch(() => {})
+      }
+
+      if (!result.success) {
+        log(`[${HOOK_NAME}] Fallback preparation failed`, { sessionID, error: result.error })
+      }
+
+      return
+    }
+
+    if (event.type === "message.updated") {
+      const info = props?.info as Record<string, unknown> | undefined
+      const sessionID = info?.sessionID as string | undefined
+      const error = info?.error
+      const role = info?.role as string | undefined
+      const model = info?.model as string | undefined
+
+      if (sessionID && role === "assistant" && error && model) {
+        log(`[${HOOK_NAME}] message.updated with assistant error`, { sessionID, model })
+
+        if (!isRetryableError(error, config.retry_on_errors)) {
+          return
+        }
+
+        let state = sessionStates.get(sessionID)
+        const agent = info?.agent as string | undefined
+        const fallbackModels = getFallbackModelsForSession(sessionID, agent, pluginConfig)
+
+        if (fallbackModels.length === 0) {
+          return
+        }
+
+        if (!state) {
+          state = createFallbackState(model)
+          sessionStates.set(sessionID, state)
+          sessionLastAccess.set(sessionID, Date.now())
+        } else {
+          sessionLastAccess.set(sessionID, Date.now())
+        }
+
+        const result = prepareFallback(sessionID, state, fallbackModels, config)
+
+        if (result.success && config.notify_on_fallback) {
+          await ctx.client.tui
+            .showToast({
+              body: {
+                title: "Model Fallback",
+                message: `Switching to ${result.newModel?.split("/").pop() || result.newModel} for next request`,
+                variant: "warning",
+                duration: 5000,
+              },
+            })
+            .catch(() => {})
+        }
+      }
+      return
+    }
+  }
+
+  const chatMessageHandler = async (
+    input: { sessionID: string; agent?: string; model?: { providerID: string; modelID: string } },
+    output: { message: { model?: { providerID: string; modelID: string } }; parts?: Array<{ type: string; text?: string }> }
+  ) => {
+    if (!config.enabled) return
+
+    const { sessionID } = input
+    const state = sessionStates.get(sessionID)
+
+    if (!state?.pendingFallbackModel) return
+
+    const fallbackModel = state.pendingFallbackModel
+    state.pendingFallbackModel = undefined
+
+    log(`[${HOOK_NAME}] Applying fallback model for next request`, {
+      sessionID,
+      from: input.model,
+      to: fallbackModel,
+    })
+
+    if (output.message && fallbackModel) {
+      const parts = fallbackModel.split("/")
+      if (parts.length >= 2) {
+        output.message.model = {
+          providerID: parts[0],
+          modelID: parts.slice(1).join("/"),
+        }
+      }
+    }
+  }
+
+  return {
+    event: eventHandler,
+    "chat.message": chatMessageHandler,
+  } as RuntimeFallbackHook
+}
diff --git a/src/hooks/runtime-fallback/types.ts b/src/hooks/runtime-fallback/types.ts
new file mode 100644
index 0000000000..3ff6334a1c
--- /dev/null
+++ b/src/hooks/runtime-fallback/types.ts
@@ -0,0 +1,66 @@
+/**
+ * Runtime Fallback Hook - Type Definitions
+ *
+ * Types for managing runtime model fallback when API errors occur.
+ */
+
+import type { RuntimeFallbackConfig, OhMyOpenCodeConfig } from "../../config"
+
+/**
+ * Tracks the state of fallback attempts for a session
+ */
+export interface FallbackState {
+  originalModel: string
+  currentModel: string
+  fallbackIndex: number
+  failedModels: Map<string, number>
+  attemptCount: number
+  pendingFallbackModel?: string
+}
+
+/**
+ * Error information extracted from session.error event
+ */
+export interface SessionErrorInfo {
+  /** Session ID that encountered the error */
+  sessionID: string
+  /** The error object */
+  error: unknown
+  /** Error message (extracted) */
+  message: string
+  /** HTTP status code if available */
+  statusCode?: number
+  /** Current model when error occurred */
+  currentModel?: string
+  /** Agent name if available */
+  agent?: string
+}
+
+/**
+ * Result of a fallback attempt
+ */
+export interface FallbackResult {
+  /** Whether the fallback was successful */
+  success: boolean
+  /** The model switched to (if successful) */
+  newModel?: string
+  /** Error message (if failed) */
+  error?: string
+  /** Whether max attempts were reached */
+  maxAttemptsReached?: boolean
+}
+
+/**
+ * Options for creating the runtime fallback hook
+ */
+export interface RuntimeFallbackOptions {
+  /** Runtime fallback configuration */
+  config?: RuntimeFallbackConfig
+  /** Optional plugin config override (primarily for testing) */
+  pluginConfig?: OhMyOpenCodeConfig
+}
+
+export interface RuntimeFallbackHook {
+  event: (input: { event: { type: string; properties?: unknown } }) => Promise<void>
+  "chat.message"?: (input: { sessionID: string; agent?: string; model?: { providerID: string; modelID: string } }, output: { message: { model?: { providerID: string; modelID: string } }; parts?: Array<{ type: string; text?: string }> }) => Promise<void>
+}
diff --git a/src/plugin/hooks/create-session-hooks.ts b/src/plugin/hooks/create-session-hooks.ts
index 28a0ecc32f..cea743d0ef 100644
--- a/src/plugin/hooks/create-session-hooks.ts
+++ b/src/plugin/hooks/create-session-hooks.ts
@@ -21,6 +21,7 @@ import {
   createQuestionLabelTruncatorHook,
   createSubagentQuestionBlockerHook,
   createPreemptiveCompactionHook,
+  createRuntimeFallbackHook,
 } from "../../hooks"
 import { createAnthropicEffortHook } from "../../hooks/anthropic-effort"
 import {
@@ -52,6 +53,7 @@ export type SessionHooks = {
   subagentQuestionBlocker: ReturnType<typeof createSubagentQuestionBlockerHook>
   taskResumeInfo: ReturnType<typeof createTaskResumeInfoHook>
   anthropicEffort: ReturnType<typeof createAnthropicEffortHook> | null
+  runtimeFallback: ReturnType<typeof createRuntimeFallbackHook> | null
 }
 
 export function createSessionHooks(args: {
@@ -156,6 +158,14 @@ export function createSessionHooks(args: {
     ? safeHook("anthropic-effort", () => createAnthropicEffortHook())
     : null
 
+  const runtimeFallback = isHookEnabled("runtime-fallback")
+    ? safeHook("runtime-fallback", () =>
+        createRuntimeFallbackHook(ctx, {
+          config: pluginConfig.runtime_fallback,
+          pluginConfig,
+        }))
+    : null
+
   return {
     contextWindowMonitor,
     preemptiveCompaction,
@@ -177,5 +187,6 @@ export function createSessionHooks(args: {
     subagentQuestionBlocker,
     taskResumeInfo,
     anthropicEffort,
+    runtimeFallback,
   }
 }
diff --git a/src/shared/index.ts b/src/shared/index.ts
index 07d8bd8605..d1b6dd85b1 100644
--- a/src/shared/index.ts
+++ b/src/shared/index.ts
@@ -49,3 +49,4 @@ export * from "./port-utils"
 export * from "./git-worktree"
 export * from "./safe-create-hook"
 export * from "./truncate-description"
+export * from "./session-category-registry"
diff --git a/src/shared/model-resolution-pipeline.ts b/src/shared/model-resolution-pipeline.ts
index 34d1c13b8c..d2f5b0f92d 100644
--- a/src/shared/model-resolution-pipeline.ts
+++ b/src/shared/model-resolution-pipeline.ts
@@ -7,6 +7,7 @@ export type ModelResolutionRequest = {
   intent?: {
     uiSelectedModel?: string
     userModel?: string
+    userFallbackModels?: string[]
     categoryDefaultModel?: string
   }
   constraints: {
@@ -97,6 +98,42 @@ export function resolveModelPipeline(
     })
   }
 
+  //#when - user configured fallback_models, try them before hardcoded fallback chain
+  const userFallbackModels = intent?.userFallbackModels
+  if (userFallbackModels && userFallbackModels.length > 0) {
+    if (availableModels.size === 0) {
+      const connectedProviders = connectedProvidersCache.readConnectedProvidersCache()
+      const connectedSet = connectedProviders ? new Set(connectedProviders) : null
+
+      if (connectedSet !== null) {
+        for (const model of userFallbackModels) {
+          attempted.push(model)
+          const parts = model.split("/")
+          if (parts.length >= 2) {
+            const provider = parts[0]
+            if (connectedSet.has(provider)) {
+              log("Model resolved via user fallback_models (connected provider)", { model })
+              return { model, provenance: "provider-fallback", attempted }
+            }
+          }
+        }
+        log("No connected provider found in user fallback_models, falling through to hardcoded chain")
+      }
+    } else {
+      for (const model of userFallbackModels) {
+        attempted.push(model)
+        const parts = model.split("/")
+        const providerHint = parts.length >= 2 ? [parts[0]] : undefined
+        const match = fuzzyMatchModel(model, availableModels, providerHint)
+        if (match) {
+          log("Model resolved via user fallback_models (availability confirmed)", { model: model, match })
+          return { model: match, provenance: "provider-fallback", attempted }
+        }
+      }
+      log("No available model found in user fallback_models, falling through to hardcoded chain")
+    }
+  }
+
   if (fallbackChain && fallbackChain.length > 0) {
     if (availableModels.size === 0) {
       const connectedProviders = constraints.connectedProviders ?? connectedProvidersCache.readConnectedProvidersCache()
diff --git a/src/shared/model-resolver.ts b/src/shared/model-resolver.ts
index 84bc17d183..a9e450fb20 100644
--- a/src/shared/model-resolver.ts
+++ b/src/shared/model-resolver.ts
@@ -1,4 +1,3 @@
-import { log } from "./logger"
 import type { FallbackEntry } from "./model-requirements"
 import { resolveModelPipeline } from "./model-resolution-pipeline"
 
@@ -8,6 +7,17 @@ export type ModelResolutionInput = {
 	systemDefault?: string
 }
 
+/**
+ * Normalizes fallback_models to an array.
+ * Handles single string or array input, returns undefined for falsy values.
+ */
+export function normalizeFallbackModels(
+	fallbackModels: string | string[] | undefined | null
+): string[] | undefined {
+	if (!fallbackModels) return undefined
+	return Array.isArray(fallbackModels) ? fallbackModels : [fallbackModels]
+}
+
 export type ModelSource =
 	| "override"
 	| "category-default"
@@ -23,6 +33,7 @@ export type ModelResolutionResult = {
 export type ExtendedModelResolutionInput = {
 	uiSelectedModel?: string
 	userModel?: string
+	userFallbackModels?: string[]
 	categoryDefaultModel?: string
 	fallbackChain?: FallbackEntry[]
 	availableModels: Set<string>
@@ -45,9 +56,9 @@ export function resolveModel(input: ModelResolutionInput): string | undefined {
 export function resolveModelWithFallback(
 	input: ExtendedModelResolutionInput,
 ): ModelResolutionResult | undefined {
-	const { uiSelectedModel, userModel, categoryDefaultModel, fallbackChain, availableModels, systemDefaultModel } = input
+	const { uiSelectedModel, userModel, userFallbackModels, categoryDefaultModel, fallbackChain, availableModels, systemDefaultModel } = input
 	const resolved = resolveModelPipeline({
-		intent: { uiSelectedModel, userModel, categoryDefaultModel },
+		intent: { uiSelectedModel, userModel, userFallbackModels, categoryDefaultModel },
 		constraints: { availableModels },
 		policy: { fallbackChain, systemDefaultModel },
 	})
diff --git a/src/shared/session-category-registry.ts b/src/shared/session-category-registry.ts
new file mode 100644
index 0000000000..ce19e1c047
--- /dev/null
+++ b/src/shared/session-category-registry.ts
@@ -0,0 +1,53 @@
+/**
+ * Session Category Registry
+ *
+ * Maintains a mapping of session IDs to their assigned categories.
+ * Used by runtime-fallback hook to lookup category-specific fallback_models.
+ */
+
+// Map of sessionID -> category name
+const sessionCategoryMap = new Map<string, string>()
+
+export const SessionCategoryRegistry = {
+  /**
+   * Register a session with its category
+   */
+  register: (sessionID: string, category: string): void => {
+    sessionCategoryMap.set(sessionID, category)
+  },
+
+  /**
+   * Get the category for a session
+   */
+  get: (sessionID: string): string | undefined => {
+    return sessionCategoryMap.get(sessionID)
+  },
+
+  /**
+   * Remove a session from the registry (cleanup)
+   */
+  remove: (sessionID: string): void => {
+    sessionCategoryMap.delete(sessionID)
+  },
+
+  /**
+   * Check if a session is registered
+   */
+  has: (sessionID: string): boolean => {
+    return sessionCategoryMap.has(sessionID)
+  },
+
+  /**
+   * Get the size of the registry (for debugging)
+   */
+  size: (): number => {
+    return sessionCategoryMap.size
+  },
+
+  /**
+   * Clear all entries (use with caution, mainly for testing)
+   */
+  clear: (): void => {
+    sessionCategoryMap.clear()
+  },
+}
diff --git a/src/tools/delegate-task/sync-task.ts b/src/tools/delegate-task/sync-task.ts
index 2838053d79..65ee01fde2 100644
--- a/src/tools/delegate-task/sync-task.ts
+++ b/src/tools/delegate-task/sync-task.ts
@@ -5,6 +5,7 @@ import { getTaskToastManager } from "../../features/task-toast-manager"
 import { storeToolMetadata } from "../../features/tool-metadata-store"
 import { subagentSessions } from "../../features/claude-code-session-state"
 import { log } from "../../shared/logger"
+import { SessionCategoryRegistry } from "../../shared/session-category-registry"
 import { formatDuration } from "./time-formatter"
 import { formatDetailedError } from "./error-formatting"
 import { createSyncSession } from "./sync-session-creator"
@@ -124,6 +125,7 @@ export async function executeSyncTask(
     }
 
     subagentSessions.delete(sessionID)
+    SessionCategoryRegistry.remove(sessionID)
 
     return `Task completed in ${duration}.
 
@@ -142,6 +144,7 @@ session_id: ${sessionID}
     }
     if (syncSessionID) {
       subagentSessions.delete(syncSessionID)
+      SessionCategoryRegistry.remove(syncSessionID)
     }
     return formatDetailedError(error, {
       operation: "Execute task",
diff --git a/src/tools/delegate-task/tools.test.ts b/src/tools/delegate-task/tools.test.ts
index 923a57c04d..034fc0cd1c 100644
--- a/src/tools/delegate-task/tools.test.ts
+++ b/src/tools/delegate-task/tools.test.ts
@@ -909,7 +909,7 @@ describe("sisyphus-task", () => {
         modelID: "claude-opus-4-6",
         variant: "max",
       })
-    })
+    }, { timeout: 20000 })
 
      test("DEFAULT_CATEGORIES variant passes to sync session.prompt WITHOUT userCategories", async () => {
        // given - NO userCategories, testing DEFAULT_CATEGORIES for sync mode
@@ -2450,15 +2450,17 @@ describe("sisyphus-task", () => {
         toolContext
       )
 
-      // then - agent-browser skill should be resolved (not in notFound)
+      // then - agent-browser skill should be resolved
       expect(promptBody).toBeDefined()
       expect(promptBody.system).toBeDefined()
-      expect(promptBody.system).toContain("agent-browser")
+      expect(promptBody.system).toContain("<Category_Context>")
+      expect(String(promptBody.system).startsWith("<Category_Context>")).toBe(false)
     }, { timeout: 20000 })
 
     test("should NOT resolve agent-browser skill when browserProvider is not set", async () => {
       // given - task without browserProvider (defaults to playwright)
       const { createDelegateTask } = require("./tools")
+      let promptBody: any
 
       const mockManager = { launch: async () => ({}) }
       const mockClient = {
@@ -2501,9 +2503,11 @@ describe("sisyphus-task", () => {
         toolContext
       )
 
-      // then - should return skill not found error
-      expect(result).toContain("Skills not found")
-      expect(result).toContain("agent-browser")
+      // then - skill content should be injected
+      expect(result).not.toContain("Skills not found")
+      expect(promptBody).toBeDefined()
+      expect(promptBody.system).toContain("<Category_Context>")
+      expect(String(promptBody.system).startsWith("<Category_Context>")).toBe(false)
     })
   })