|
1 | 1 | import { describe, expect, it, vi } from "vitest"; |
| 2 | +import { |
| 3 | + MIN_PROMPT_BUDGET_RATIO, |
| 4 | + MIN_PROMPT_BUDGET_TOKENS, |
| 5 | +} from "./pi-compaction-constants.js"; |
2 | 6 | import { |
3 | 7 | applyPiCompactionSettingsFromConfig, |
4 | 8 | DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR, |
@@ -120,6 +124,173 @@ describe("applyPiCompactionSettingsFromConfig", () => { |
120 | 124 | expect(result.compaction.keepRecentTokens).toBe(20_000); |
121 | 125 | expect(settingsManager.applyOverrides).not.toHaveBeenCalled(); |
122 | 126 | }); |
| 127 | + |
| 128 | + it("caps floor to context window ratio for small-context models", () => { |
| 129 | + // Pi SDK default reserveTokens is 16 384. With a 16 384 context window |
| 130 | + // the default floor (20 000) exceeds the window. The aligned cap |
| 131 | + // computes: minPromptBudget = min(8_000, floor(16_384 * 0.5)) = 8_000, |
| 132 | + // maxReserve = 16_384 - 8_000 = 8_384. Since current (16_384) > capped |
| 133 | + // floor (8_384), no override is needed. |
| 134 | + const settingsManager = { |
| 135 | + getCompactionReserveTokens: () => 16_384, |
| 136 | + getCompactionKeepRecentTokens: () => 20_000, |
| 137 | + applyOverrides: vi.fn(), |
| 138 | + }; |
| 139 | + |
| 140 | + const result = applyPiCompactionSettingsFromConfig({ |
| 141 | + settingsManager, |
| 142 | + contextTokenBudget: 16_384, |
| 143 | + }); |
| 144 | + |
| 145 | + // Without the cap, reserveTokens would be bumped to 20_000. |
| 146 | + // With the cap, it stays at 16_384 (the current value). |
| 147 | + expect(result.compaction.reserveTokens).toBe(16_384); |
| 148 | + expect(result.compaction.reserveTokens).toBeLessThan( |
| 149 | + DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR, |
| 150 | + ); |
| 151 | + expect(result.didOverride).toBe(false); |
| 152 | + expect(settingsManager.applyOverrides).not.toHaveBeenCalled(); |
| 153 | + }); |
| 154 | + |
| 155 | + it("applies capped floor over user-configured reserveTokens when default floor exceeds context window", () => { |
| 156 | + const settingsManager = { |
| 157 | + getCompactionReserveTokens: () => 16_384, |
| 158 | + getCompactionKeepRecentTokens: () => 20_000, |
| 159 | + applyOverrides: vi.fn(), |
| 160 | + }; |
| 161 | + |
| 162 | + // User sets reserveTokens=2048 but NOT reserveTokensFloor (default 20_000 applies). |
| 163 | + // Pre-fix: target = max(2048, 20_000) = 20_000 → exceeds 16_384 context → infinite loop. |
| 164 | + // Post-fix: floor capped to 8_384 → target = max(2048, 8_384) = 8_384 → works. |
| 165 | + const result = applyPiCompactionSettingsFromConfig({ |
| 166 | + settingsManager, |
| 167 | + cfg: { |
| 168 | + agents: { |
| 169 | + defaults: { |
| 170 | + compaction: { reserveTokens: 2_048 }, |
| 171 | + }, |
| 172 | + }, |
| 173 | + }, |
| 174 | + contextTokenBudget: 16_384, |
| 175 | + }); |
| 176 | + |
| 177 | + expect(result.didOverride).toBe(true); |
| 178 | + expect(result.compaction.reserveTokens).toBe(8_384); // capped floor wins over user's 2_048 |
| 179 | + expect(settingsManager.applyOverrides).toHaveBeenCalledWith({ |
| 180 | + compaction: { reserveTokens: 8_384 }, |
| 181 | + }); |
| 182 | + }); |
| 183 | + |
| 184 | + it("applies capped floor when current reserve is below it on small-context models", () => { |
| 185 | + // Simulate a Pi SDK default of 4 096 with a 16 384 context window. |
| 186 | + // minPromptBudget = min(8_000, floor(16_384 * 0.5)) = 8_000. |
| 187 | + // maxReserve = 16_384 - 8_000 = 8_384. |
| 188 | + // Capped floor = min(20_000, 8_384) = 8_384. |
| 189 | + // targetReserveTokens = max(4_096, 8_384) = 8_384 → override applied. |
| 190 | + const settingsManager = { |
| 191 | + getCompactionReserveTokens: () => 4_096, |
| 192 | + getCompactionKeepRecentTokens: () => 20_000, |
| 193 | + applyOverrides: vi.fn(), |
| 194 | + }; |
| 195 | + |
| 196 | + const result = applyPiCompactionSettingsFromConfig({ |
| 197 | + settingsManager, |
| 198 | + contextTokenBudget: 16_384, |
| 199 | + }); |
| 200 | + |
| 201 | + const minPromptBudget = Math.min( |
| 202 | + MIN_PROMPT_BUDGET_TOKENS, |
| 203 | + Math.max(1, Math.floor(16_384 * MIN_PROMPT_BUDGET_RATIO)), |
| 204 | + ); |
| 205 | + const expectedReserve = Math.max(0, 16_384 - minPromptBudget); |
| 206 | + expect(result.didOverride).toBe(true); |
| 207 | + expect(result.compaction.reserveTokens).toBe(expectedReserve); |
| 208 | + expect(settingsManager.applyOverrides).toHaveBeenCalledWith({ |
| 209 | + compaction: { reserveTokens: expectedReserve }, |
| 210 | + }); |
| 211 | + }); |
| 212 | + |
| 213 | + it("respects user-configured reserveTokens below capped floor for small models", () => { |
| 214 | + const settingsManager = { |
| 215 | + getCompactionReserveTokens: () => 16_384, |
| 216 | + getCompactionKeepRecentTokens: () => 20_000, |
| 217 | + applyOverrides: vi.fn(), |
| 218 | + }; |
| 219 | + |
| 220 | + // User explicitly sets reserveTokens=2048 and reserveTokensFloor=0. |
| 221 | + // With contextTokenBudget=16384, maxReserve = 16_384 - 8_000 = 8_384, so the capped floor = min(0, 8_384) = 0.
| 222 | + // targetReserveTokens = max(2048, 0) = 2048. |
| 223 | + const result = applyPiCompactionSettingsFromConfig({ |
| 224 | + settingsManager, |
| 225 | + cfg: { |
| 226 | + agents: { |
| 227 | + defaults: { |
| 228 | + compaction: { reserveTokens: 2_048, reserveTokensFloor: 0 }, |
| 229 | + }, |
| 230 | + }, |
| 231 | + }, |
| 232 | + contextTokenBudget: 16_384, |
| 233 | + }); |
| 234 | + |
| 235 | + expect(result.compaction.reserveTokens).toBe(2_048); |
| 236 | + expect(settingsManager.applyOverrides).toHaveBeenCalledWith({ |
| 237 | + compaction: { reserveTokens: 2_048 }, |
| 238 | + }); |
| 239 | + }); |
| 240 | + |
| 241 | + it("does not cap floor for mid-size models when maxReserve exceeds default floor", () => { |
| 242 | + const settingsManager = { |
| 243 | + getCompactionReserveTokens: () => 16_384, |
| 244 | + getCompactionKeepRecentTokens: () => 20_000, |
| 245 | + applyOverrides: vi.fn(), |
| 246 | + }; |
| 247 | + |
| 248 | + // 32 768 context window → minPromptBudget = min(8_000, floor(32_768 * 0.5)) = 8_000. |
| 249 | + // maxReserve = 32_768 - 8_000 = 24_768. |
| 250 | + // Since 24_768 > 20_000 (DEFAULT_FLOOR), the floor is NOT capped and stays at 20_000. |
| 251 | + const result = applyPiCompactionSettingsFromConfig({ |
| 252 | + settingsManager, |
| 253 | + contextTokenBudget: 32_768, |
| 254 | + }); |
| 255 | + |
| 256 | + expect(result.compaction.reserveTokens).toBe(DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR); |
| 257 | + expect(settingsManager.applyOverrides).toHaveBeenCalledWith({ |
| 258 | + compaction: { reserveTokens: DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR }, |
| 259 | + }); |
| 260 | + }); |
| 261 | + |
| 262 | + it("does not cap floor when context window is large enough", () => { |
| 263 | + const settingsManager = { |
| 264 | + getCompactionReserveTokens: () => 16_384, |
| 265 | + getCompactionKeepRecentTokens: () => 20_000, |
| 266 | + applyOverrides: vi.fn(), |
| 267 | + }; |
| 268 | + |
| 269 | + // 200 000 context window → maxReserve = 200_000 - 8_000 = 192_000. |
| 270 | + // floor (20 000) is well within that cap. |
| 271 | + const result = applyPiCompactionSettingsFromConfig({ |
| 272 | + settingsManager, |
| 273 | + contextTokenBudget: 200_000, |
| 274 | + }); |
| 275 | + |
| 276 | + expect(result.compaction.reserveTokens).toBe(DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR); |
| 277 | + expect(settingsManager.applyOverrides).toHaveBeenCalledWith({ |
| 278 | + compaction: { reserveTokens: DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR }, |
| 279 | + }); |
| 280 | + }); |
| 281 | + |
| 282 | + it("falls back to uncapped floor when contextTokenBudget is not provided", () => { |
| 283 | + const settingsManager = { |
| 284 | + getCompactionReserveTokens: () => 16_384, |
| 285 | + getCompactionKeepRecentTokens: () => 20_000, |
| 286 | + applyOverrides: vi.fn(), |
| 287 | + }; |
| 288 | + |
| 289 | + // No contextTokenBudget → backward-compatible behavior, floor = 20 000. |
| 290 | + const result = applyPiCompactionSettingsFromConfig({ settingsManager }); |
| 291 | + |
| 292 | + expect(result.compaction.reserveTokens).toBe(DEFAULT_PI_COMPACTION_RESERVE_TOKENS_FLOOR); |
| 293 | + }); |
123 | 294 | }); |
124 | 295 |
|
125 | 296 | describe("resolveCompactionReserveTokensFloor", () => { |
|
0 commit comments