Skip to content

Commit 6043ee2

Browse files
committed
switch to kimi k2.6, 9am ET to 5pm PT
1 parent 350576c commit 6043ee2

18 files changed

Lines changed: 81 additions & 89 deletions

File tree

agents/base2/base2.ts

Lines changed: 6 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -25,18 +25,16 @@ export function createBase2(
2525
const isFree = mode === 'free' || mode === 'lite'
2626

2727
const isSonnet = false
28-
const model = isFree ? 'minimax/minimax-m2.7' : 'anthropic/claude-opus-4.7'
28+
const model = isFree ? 'moonshotai/kimi-k2.6' : 'anthropic/claude-opus-4.7'
2929

3030
return {
3131
publisher,
3232
model,
33-
providerOptions: isFree
34-
? {
35-
data_collection: 'deny',
36-
}
37-
: {
38-
only: ['amazon-bedrock'],
39-
},
33+
providerOptions: isFree ? {
34+
data_collection: 'deny',
35+
} : {
36+
only: ['amazon-bedrock'],
37+
},
4038
displayName: 'Buffy the Orchestrator',
4139
spawnerPrompt:
4240
'Advanced base agent that orchestrates planning, editing, and reviewing for complex coding tasks',

agents/reviewer/code-reviewer-lite.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ import { createReviewer } from './code-reviewer'
55
const definition: SecretAgentDefinition = {
66
id: 'code-reviewer-lite',
77
publisher,
8-
...createReviewer('minimax/minimax-m2.7'),
8+
...createReviewer('moonshotai/kimi-k2.6'),
99
}
1010

1111
export default definition

agents/types/agent-definition.ts

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -423,8 +423,8 @@ export type ModelName =
423423
// Other open source models
424424
| 'moonshotai/kimi-k2'
425425
| 'moonshotai/kimi-k2:nitro'
426-
| 'moonshotai/kimi-k2.5'
427-
| 'moonshotai/kimi-k2.5:nitro'
426+
| 'moonshotai/kimi-k2.6'
427+
| 'moonshotai/kimi-k2.6:nitro'
428428
| 'z-ai/glm-5'
429429
| 'z-ai/glm-5.1'
430430
| 'z-ai/glm-4.6'

cli/src/hooks/use-freebuff-session.ts

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -78,7 +78,8 @@ async function callSession(
7878
}
7979
// 409 from POST means the selected model cannot be joined right now, either
8080
// because an active session is locked to another model or because a
81-
// deployment-hours-only model is closed. Surface both as non-throw states.
81+
// temporary model availability closure applies. Surface both cases
82+
// as non-throw states.
8283
if (resp.status === 409 && method === 'POST') {
8384
const body = (await resp.json().catch(() => null)) as
8485
| FreebuffSessionResponse

common/src/constants/free-agents.ts

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ export const FREE_MODE_AGENT_MODELS: Record<string, Set<string>> = {
2828
// Root orchestrator
2929
'base2-free': new Set([
3030
'minimax/minimax-m2.7',
31-
'moonshotai/kimi-k2.5',
31+
'moonshotai/kimi-k2.6',
3232
]),
3333

3434
// File exploration agents
@@ -46,13 +46,13 @@ export const FREE_MODE_AGENT_MODELS: Record<string, Set<string>> = {
4646
// Editor for free mode
4747
'editor-lite': new Set([
4848
'minimax/minimax-m2.7',
49-
'moonshotai/kimi-k2.5',
49+
'moonshotai/kimi-k2.6',
5050
]),
5151

5252
// Code reviewer for free mode
5353
'code-reviewer-lite': new Set([
5454
'minimax/minimax-m2.7',
55-
'moonshotai/kimi-k2.5',
55+
'moonshotai/kimi-k2.6',
5656
]),
5757
}
5858

common/src/constants/freebuff-models.ts

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@ export interface FreebuffModelOption {
1818
}
1919

2020
export const FREEBUFF_DEPLOYMENT_HOURS_LABEL = '9am ET-5pm PT'
21-
export const FREEBUFF_KIMI_MODEL_ID = 'moonshotai/kimi-k2.5'
21+
export const FREEBUFF_KIMI_MODEL_ID = 'moonshotai/kimi-k2.6'
2222

2323
export const FREEBUFF_MODELS = [
2424
{
@@ -29,7 +29,7 @@ export const FREEBUFF_MODELS = [
2929
},
3030
{
3131
id: FREEBUFF_KIMI_MODEL_ID,
32-
displayName: 'Kimi K2.5',
32+
displayName: 'Kimi K2.6',
3333
tagline: 'Balanced',
3434
availability: 'deployment_hours',
3535
},
@@ -83,7 +83,7 @@ export function isFreebuffDeploymentHours(now: Date = new Date()): boolean {
8383
const eastern = getZonedParts(now, 'America/New_York')
8484
const pacific = getZonedParts(now, 'America/Los_Angeles')
8585
if (eastern.weekday === 'Sat' || eastern.weekday === 'Sun') return false
86-
return eastern.minutes >= 9 * 60 && pacific.minutes < 24 * 60
86+
return eastern.minutes >= 9 * 60 && pacific.minutes < 17 * 60
8787
}
8888

8989
export function isFreebuffModelAvailable(

common/src/templates/initial-agents-dir/types/agent-definition.ts

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -423,8 +423,8 @@ export type ModelName =
423423
// Other open source models
424424
| 'moonshotai/kimi-k2'
425425
| 'moonshotai/kimi-k2:nitro'
426-
| 'moonshotai/kimi-k2.5'
427-
| 'moonshotai/kimi-k2.5:nitro'
426+
| 'moonshotai/kimi-k2.6'
427+
| 'moonshotai/kimi-k2.6:nitro'
428428
| 'z-ai/glm-5'
429429
| 'z-ai/glm-5.1'
430430
| 'z-ai/glm-4.6'

common/src/types/freebuff-session.ts

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -93,8 +93,7 @@ export type FreebuffSessionServerResponse =
9393
requestedModel: string
9494
}
9595
| {
96-
/** Requested model is valid but not selectable right now. Currently
97-
* used for deployment-hours-only models such as Kimi K2.5. */
96+
/** Requested model is valid but not selectable right now. */
9897
status: 'model_unavailable'
9998
requestedModel: string
10099
availableHours: string

docs/freebuff-waiting-room.md

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
The waiting room is the admission control layer for **free-mode** requests against the freebuff Fireworks deployments. It has three jobs:
66

77
1. **Drip-admit users per model** — each selectable freebuff model has its own FIFO queue. Admission runs one tick (default `ADMISSION_TICK_MS`, 15s) that tries to admit one user per model, so heavier models can sit cold without starving lighter ones.
8-
2. **Gate on per-deployment health and hours** — a single fleet probe per tick (`getFleetHealth` in `web/src/server/free-session/fireworks-health.ts`) hits the Fireworks metrics endpoint and classifies each dedicated deployment as `healthy | degraded | unhealthy`. Only models whose deployment is `healthy` and currently available admit that tick; Kimi K2.5 is available during 9am ET-5pm PT on weekdays, while MiniMax M2.7 is serverless and always available.
8+
2. **Gate on per-deployment health and hours** — a single fleet probe per tick (`getFleetHealth` in `web/src/server/free-session/fireworks-health.ts`) hits the Fireworks metrics endpoint and classifies each dedicated deployment as `healthy | degraded | unhealthy`. Only models whose deployment is `healthy` and currently available admit that tick; Kimi K2.6 is available during 9am ET-5pm PT on weekdays, while MiniMax M2.7 is serverless and always available.
99
3. **One instance per account** — prevent a single user from running N concurrent freebuff CLIs to get N× throughput.
1010

1111
Users who cannot be admitted immediately are placed in the queue for their chosen model and given an estimated wait time. Admitted users get a fixed-length session (default 1h) bound to the model they were admitted on; chat completions use that model for the life of the session.
@@ -149,8 +149,8 @@ The final tick result carries a `queueDepthByModel` map and a single `skipped` r
149149
| Constant | Location | Default | Purpose |
150150
|---|---|---|---|
151151
| `ADMISSION_TICK_MS` | `config.ts` | 15000 | How often the ticker fires. Up to one user is admitted per model per tick. |
152-
| `FREEBUFF_MODELS` | `common/src/constants/freebuff-models.ts` | `minimax-m2.7`, `kimi-k2.5` | Selectable models; each gets its own queue and admission slot. |
153-
| `FIREWORKS_DEPLOYMENT_MAP` | `web/src/llm-api/fireworks-config.ts` | `kimi-k2.5` | Models with dedicated Fireworks deployments. Models not listed are treated as `healthy` (serverless fallback) — drop this default when they migrate to their own deployments. |
152+
| `FREEBUFF_MODELS` | `common/src/constants/freebuff-models.ts` | `minimax-m2.7`, `kimi-k2.6` | Selectable models; each gets its own queue and admission slot. |
153+
| `FIREWORKS_DEPLOYMENT_MAP` | `web/src/llm-api/fireworks-config.ts` | `kimi-k2.6` | Models with dedicated Fireworks deployments. Models not listed are treated as `healthy` (serverless fallback) — drop this default when they migrate to their own deployments. |
154154
| `HEALTH_CACHE_TTL_MS` | `fireworks-health.ts` | 25000 | Fleet probe cache TTL. Sits just under the Fireworks 30s exporter cadence and 6 req/min rate limit. |
155155
| `FREEBUFF_SESSION_LENGTH_MS` | env | 3_600_000 | Session lifetime |
156156
| `FREEBUFF_SESSION_GRACE_MS` | env | 1_800_000 | Drain window after expiry — gate still admits requests so an in-flight agent can finish, but the CLI is expected to block new prompts. Hard cutoff at `expires_at + grace`. |
@@ -185,7 +185,7 @@ Response shapes:
185185
"queueDepth": 43, // size of this model's queue
186186
"queueDepthByModel": { // snapshot of every model's queue — powers the
187187
"minimax/minimax-m2.7": 43, // "N ahead" hint in the selector. Missing
188-
"moonshotai/kimi-k2.5": 4 // entries should be treated as 0.
188+
"moonshotai/kimi-k2.6": 4 // entries should be treated as 0.
189189
},
190190
"estimatedWaitMs": 384000,
191191
"queuedAt": "2026-04-17T12:00:00Z"
@@ -285,7 +285,7 @@ waitMs = (position - 1) * 24_000
285285
- Position 1 → 0 (next tick admits you)
286286
- Position 2 → 24s, and so on.
287287

288-
`position` is scoped to this model's queue — a user at position 1 in the `minimax/minimax-m2.7` queue is not affected by the depth of the `moonshotai/kimi-k2.5` queue. The estimate is intentionally decoupled from the admission tick — it's a human-friendly rule-of-thumb for the UI, not a precise projection. Actual wait depends on admission-tick cadence, health-gated pauses, and deployment-hours availability (during a Kimi Fireworks incident or outside 9am ET-5pm PT, only Kimi's queue stalls; MiniMax keeps draining), so the real wait can be longer or shorter.
288+
`position` is scoped to this model's queue — a user at position 1 in the `minimax/minimax-m2.7` queue is not affected by the depth of the `moonshotai/kimi-k2.6` queue. The estimate is intentionally decoupled from the admission tick — it's a human-friendly rule-of-thumb for the UI, not a precise projection. Actual wait depends on admission-tick cadence, health-gated pauses, and deployment-hours availability (during a Kimi Fireworks incident or outside 9am ET-5pm PT, only Kimi's queue stalls; MiniMax keeps draining), so the real wait can be longer or shorter.
289289

290290
## CLI Integration (frontend-side contract)
291291

scripts/test-fireworks-cache-intervals.ts

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
*
1414
* Models:
1515
* glm-5.1 (default) — z-ai/glm-5.1
16-
* kimi-k2.5 — moonshotai/kimi-k2.5
16+
* kimi-k2.6 — moonshotai/kimi-k2.6
1717
* minimax — minimax/minimax-m2.5
1818
*
1919
* Flags:
@@ -26,10 +26,10 @@
2626
* bun scripts/test-fireworks-cache-intervals.ts
2727
*
2828
* # Custom Kimi deployment with a faster sweep
29-
* bun scripts/test-fireworks-cache-intervals.ts kimi-k2.5 --deployment --intervals=30,60,120,300,600
29+
* bun scripts/test-fireworks-cache-intervals.ts kimi-k2.6 --deployment --intervals=30,60,120,300,600
3030
*
3131
* # Long sweep up to 1 hour
32-
* bun scripts/test-fireworks-cache-intervals.ts kimi-k2.5 --deployment --intervals=60,300,600,1200,1800,2700,3600
32+
* bun scripts/test-fireworks-cache-intervals.ts kimi-k2.6 --deployment --intervals=60,300,600,1200,1800,2700,3600
3333
*/
3434

3535
export {}
@@ -53,10 +53,10 @@ const MODEL_CONFIGS: Record<string, ModelConfig> = {
5353
cachedInputCostPerToken: 0.26 / 1_000_000,
5454
outputCostPerToken: 4.4 / 1_000_000,
5555
},
56-
'kimi-k2.5': {
57-
id: 'moonshotai/kimi-k2.5',
58-
standardModel: 'accounts/fireworks/models/kimi-k2p5',
59-
deploymentModel: 'accounts/james-65d217/deployments/y5b3z17u',
56+
'kimi-k2.6': {
57+
id: 'moonshotai/kimi-k2.6',
58+
standardModel: 'accounts/fireworks/models/kimi-k2p6',
59+
deploymentModel: 'accounts/james-65d217/deployments/j8ar2x0y',
6060
inputCostPerToken: 0.6 / 1_000_000,
6161
cachedInputCostPerToken: 0.1 / 1_000_000,
6262
outputCostPerToken: 3.0 / 1_000_000,

0 commit comments

Comments
 (0)