summary | refs | log | tree | commit | diff
path: root/packages/core/src/services/loopDetectionService.test.ts
diff options
context:
space:
mode:
Diffstat (limited to 'packages/core/src/services/loopDetectionService.test.ts')
-rw-r--r-- packages/core/src/services/loopDetectionService.test.ts 119
1 files changed, 115 insertions, 4 deletions
diff --git a/packages/core/src/services/loopDetectionService.test.ts b/packages/core/src/services/loopDetectionService.test.ts
index 2d410752..bf3afd32 100644
--- a/packages/core/src/services/loopDetectionService.test.ts
+++ b/packages/core/src/services/loopDetectionService.test.ts
@@ -4,16 +4,18 @@
* SPDX-License-Identifier: Apache-2.0
*/
-import { describe, it, expect, beforeEach, vi } from 'vitest';
-import { LoopDetectionService } from './loopDetectionService.js';
+import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
+import { Config } from '../config/config.js';
+import { GeminiClient } from '../core/client.js';
import {
GeminiEventType,
ServerGeminiContentEvent,
+ ServerGeminiStreamEvent,
ServerGeminiToolCallRequestEvent,
} from '../core/turn.js';
-import { ServerGeminiStreamEvent } from '../core/turn.js';
-import { Config } from '../config/config.js';
import * as loggers from '../telemetry/loggers.js';
+import { LoopType } from '../telemetry/types.js';
+import { LoopDetectionService } from './loopDetectionService.js';
vi.mock('../telemetry/loggers.js', () => ({
logLoopDetected: vi.fn(),
@@ -330,3 +332,112 @@ describe('LoopDetectionService', () => {
});
});
});
+
+describe('LoopDetectionService LLM Checks', () => { // Suite for the turn-count-driven LLM check, exercised through turnStarted() with a stubbed GeminiClient
+ let service: LoopDetectionService;
+ let mockConfig: Config;
+ let mockGeminiClient: GeminiClient;
+ let abortController: AbortController;
+
+ beforeEach(() => { // Fresh stubs, service and abort controller for every test
+ mockGeminiClient = { // Partial stub: only getHistory and generateJson are provided
+ getHistory: vi.fn().mockReturnValue([]),
+ generateJson: vi.fn(),
+ } as unknown as GeminiClient;
+
+ mockConfig = { // Partial Config stub exposing just the three getters below
+ getGeminiClient: () => mockGeminiClient,
+ getDebugMode: () => false,
+ getTelemetryEnabled: () => true,
+ } as unknown as Config;
+
+ service = new LoopDetectionService(mockConfig);
+ abortController = new AbortController();
+ vi.clearAllMocks(); // Clear recorded calls on all mocks, including the module-mocked logLoopDetected
+ });
+
+ afterEach(() => {
+ vi.restoreAllMocks();
+ });
+
+ const advanceTurns = async (count: number) => { // Helper: await turnStarted() `count` times in sequence, ignoring each result
+ for (let i = 0; i < count; i++) {
+ await service.turnStarted(abortController.signal);
+ }
+ };
+
+ it('should not trigger LLM check before LLM_CHECK_AFTER_TURNS', async () => {
+ await advanceTurns(29); // One turn short of the first check (see the 30th-turn test below)
+ expect(mockGeminiClient.generateJson).not.toHaveBeenCalled();
+ });
+
+ it('should trigger LLM check on the 30th turn', async () => {
+ mockGeminiClient.generateJson = vi
+ .fn()
+ .mockResolvedValue({ confidence: 0.1 });
+ await advanceTurns(30);
+ expect(mockGeminiClient.generateJson).toHaveBeenCalledTimes(1);
+ });
+
+ it('should detect a cognitive loop when confidence is high', async () => {
+ // First check at turn 30 reports confidence 0.85. NOTE(review): presumably below the service's detection threshold, since the test carries on to a second check - confirm.
+ mockGeminiClient.generateJson = vi
+ .fn()
+ .mockResolvedValue({ confidence: 0.85, reasoning: 'Repetitive actions' });
+ await advanceTurns(30);
+ expect(mockGeminiClient.generateJson).toHaveBeenCalledTimes(1);
+
+ // A confidence of 0.85 shortens the interval until the next check.
+ // Expected interval: 5 + (15 - 5) * (1 - 0.85) = 5 + 10 * 0.15 = 6.5, rounded to 7.
+ await advanceTurns(6); // Advance to turn 36, one short of the next expected check
+
+ mockGeminiClient.generateJson = vi
+ .fn()
+ .mockResolvedValue({ confidence: 0.95, reasoning: 'Repetitive actions' });
+ const finalResult = await service.turnStarted(abortController.signal); // Turn 37 (30 + 7): the second check is expected here and reports 0.95
+
+ expect(finalResult).toBe(true); // turnStarted() reports the detected loop to its caller
+ expect(loggers.logLoopDetected).toHaveBeenCalledWith(
+ mockConfig,
+ expect.objectContaining({
+ 'event.name': 'loop_detected',
+ loop_type: LoopType.LLM_DETECTED_LOOP,
+ }),
+ );
+ });
+
+ it('should not detect a loop when confidence is low', async () => {
+ mockGeminiClient.generateJson = vi
+ .fn()
+ .mockResolvedValue({ confidence: 0.5, reasoning: 'Looks okay' });
+ await advanceTurns(30);
+ const result = await service.turnStarted(abortController.signal); // Turn 31, following the 0.5-confidence check at turn 30
+ expect(result).toBe(false);
+ expect(loggers.logLoopDetected).not.toHaveBeenCalled();
+ });
+
+ it('should adjust the check interval based on confidence', async () => {
+ // Confidence is 0.0, so the interval should be MAX_LLM_CHECK_INTERVAL (15).
+ mockGeminiClient.generateJson = vi
+ .fn()
+ .mockResolvedValue({ confidence: 0.0 });
+ await advanceTurns(30); // First check at turn 30
+ expect(mockGeminiClient.generateJson).toHaveBeenCalledTimes(1);
+
+ await advanceTurns(14); // Advance to turn 44: still inside the 15-turn interval
+ expect(mockGeminiClient.generateJson).toHaveBeenCalledTimes(1);
+
+ await service.turnStarted(abortController.signal); // Turn 45 (30 + 15): second check expected
+ expect(mockGeminiClient.generateJson).toHaveBeenCalledTimes(2);
+ });
+
+ it('should handle errors from generateJson gracefully', async () => {
+ mockGeminiClient.generateJson = vi
+ .fn()
+ .mockRejectedValue(new Error('API error')); // Every LLM check rejects
+ await advanceTurns(30); // Awaited, so a rejection escaping turnStarted() would fail the test here
+ const result = await service.turnStarted(abortController.signal); // Turn 31, after the rejected check at turn 30
+ expect(result).toBe(false);
+ expect(loggers.logLoopDetected).not.toHaveBeenCalled();
+ });
+});