summary refs log tree commit diff
path: root/integration-tests/run_shell_command.test.js
blob: 2a5f9ed400a1be577e2fa8f92d1fce61dd7a5572 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
/**
 * @license
 * Copyright 2025 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */

import { test } from 'node:test';
import { strict as assert } from 'assert';
import { TestRig, printDebugInfo, validateModelOutput } from './test-helper.js';

test('should be able to run a shell command', async () => {
  const rig = new TestRig();
  await rig.setup('should be able to run a shell command');

  // The prompt is handed to rig.run() as a plain string argument.
  const output = await rig.run(
    'Please run the command "echo hello-world" and show me the output',
  );
  const sawShellToolCall = await rig.waitForToolCall('run_shell_command');

  // Dump diagnostics before asserting, so a failing run still leaves a record
  // of what was (and was not) observed.
  const outputHasMarker = output.includes('hello-world');
  if (!(sawShellToolCall && outputHasMarker)) {
    printDebugInfo(rig, output, {
      'Found tool call': sawShellToolCall,
      'Contains hello-world': outputHasMarker,
    });
  }

  assert.ok(sawShellToolCall, 'Expected to find a run_shell_command tool call');

  // Both the echoed text and "exit code 0" are passed as expected content,
  // because the model often reports the exit code instead of showing the
  // output. validateModelOutput is expected to throw when there is no output
  // and only warn when the expected content is missing.
  const expectedContent = ['hello-world', 'exit code 0'];
  validateModelOutput(output, expectedContent, 'Shell command test');
});

test('should be able to run a shell command via stdin', async () => {
  const rig = new TestRig();
  await rig.setup('should be able to run a shell command via stdin');

  // Unlike a plain string prompt, this one is wrapped in an options object
  // under the `stdin` key (presumably delivered on the CLI's standard input —
  // confirm against TestRig.run).
  const output = await rig.run({
    stdin: 'Please run the command "echo test-stdin" and show me what it outputs',
  });
  const sawShellToolCall = await rig.waitForToolCall('run_shell_command');

  // Dump diagnostics before asserting, so a failing run still leaves a record
  // of what was (and was not) observed.
  const outputHasMarker = output.includes('test-stdin');
  if (!(sawShellToolCall && outputHasMarker)) {
    printDebugInfo(rig, output, {
      'Test type': 'Stdin test',
      'Found tool call': sawShellToolCall,
      'Contains test-stdin': outputHasMarker,
    });
  }

  assert.ok(sawShellToolCall, 'Expected to find a run_shell_command tool call');

  // validateModelOutput is expected to throw when there is no output and only
  // warn when the expected content is missing.
  validateModelOutput(output, 'test-stdin', 'Shell command stdin test');
});