diff options
| author | Allen Hutchison <[email protected]> | 2025-08-01 14:33:33 -0700 |
|---|---|---|
| committer | GitHub <[email protected]> | 2025-08-01 21:33:33 +0000 |
| commit | 387706607dfa372f4f0c6fee14286bf4a290b258 (patch) | |
| tree | 353e559b91a6a03809ada72800b1f36d402d4c7c /integration-tests/save_memory.test.js | |
| parent | dccca91fc944424b032b09d29afb85d225a71dcc (diff) | |
fix(tests): refactor integration tests to be less flaky (#4890)
Co-authored-by: matt korwel <[email protected]>
Diffstat (limited to 'integration-tests/save_memory.test.js')
| -rw-r--r-- | integration-tests/save_memory.test.js | 28 |
1 file changed, 24 insertions, 4 deletions
```diff
diff --git a/integration-tests/save_memory.test.js b/integration-tests/save_memory.test.js
index 0716f978..3ec641d4 100644
--- a/integration-tests/save_memory.test.js
+++ b/integration-tests/save_memory.test.js
@@ -6,16 +6,36 @@
 
 import { test } from 'node:test';
 import { strict as assert } from 'assert';
-import { TestRig } from './test-helper.js';
+import { TestRig, printDebugInfo, validateModelOutput } from './test-helper.js';
 
-test('should be able to save to memory', async (t) => {
+test('should be able to save to memory', async () => {
   const rig = new TestRig();
-  rig.setup(t.name);
+  await rig.setup('should be able to save to memory');
 
   const prompt = `remember that my favorite color is blue.
 
   what is my favorite color? tell me that and surround it with $ symbol`;
   const result = await rig.run(prompt);
 
-  assert.ok(result.toLowerCase().includes('$blue$'));
+  const foundToolCall = await rig.waitForToolCall('save_memory');
+
+  // Add debugging information
+  if (!foundToolCall || !result.toLowerCase().includes('blue')) {
+    const allTools = printDebugInfo(rig, result, {
+      'Found tool call': foundToolCall,
+      'Contains blue': result.toLowerCase().includes('blue'),
+    });
+
+    console.error(
+      'Memory tool calls:',
+      allTools
+        .filter((t) => t.toolRequest.name === 'save_memory')
+        .map((t) => t.toolRequest.args),
+    );
+  }
+
+  assert.ok(foundToolCall, 'Expected to find a save_memory tool call');
+
+  // Validate model output - will throw if no output, warn if missing expected content
+  validateModelOutput(result, 'blue', 'Save memory test');
 });
```
