feat: Add Shell Command Execution to Custom Commands (#4917)

2025-07-27 02:00:26 -04:00 · 2025-07-27 02:00:26 -04:00 · 576cebc928
parent 9e61b3510c
commit 576cebc928
16 changed files with 1604 additions and 653 deletions
--- a/docs/cli/commands.md
+++ b/docs/cli/commands.md
@ -201,6 +201,47 @@ The command follows this format: `/changelog <version> <type> <message>`
 When you run `/changelog 1.2.0 added "New feature"`, the final text sent to the model will be the original prompt followed by two newlines and the command you typed.
 ##### 3. Executing Shell Commands with `!{...}`
 You can make your commands dynamic by executing shell commands directly within your `prompt` and injecting their output. This is ideal for gathering context from your local environment, like reading file content or checking the status of Git.
 When a custom command attempts to execute a shell command, Gemini CLI will now prompt you for confirmation before proceeding. This is a security measure to ensure that only intended commands can be run.
 **How It Works:**
 1.  **Inject Commands:** Use the `!{...}` syntax in your `prompt` to specify where the command should be run and its output injected.
 2.  **Confirm Execution:** When you run the command, a dialog will appear listing the shell commands the prompt wants to execute.
 3.  **Grant Permission:** You can choose to:
    - **Allow once:** The command(s) will run this one time.
    - **Allow always for this session:** The command(s) will be added to a temporary allowlist for the current CLI session and will not require confirmation again.
    - **No:** Cancel the execution of the shell command(s).
 The CLI still respects the global `excludeTools` and `coreTools` settings. A command will be blocked without a confirmation prompt if it is explicitly disallowed in your configuration.
 **Example (`git/commit.toml`):**
 This command gets the staged git diff and uses it to ask the model to write a commit message.
 ````toml
 # In: <project>/.gemini/commands/git/commit.toml
 # Invoked via: /git:commit
 description = "Generates a Git commit message based on staged changes."
 # The prompt uses !{...} to execute the command and inject its output.
 prompt = """
 Please generate a Conventional Commit message based on the following git diff:
 ```diff
 !{git diff --staged}
 ````
 """
 ````
 When you run `/git:commit`, the CLI first executes `git diff --staged`, then replaces `!{git diff --staged}` with the output of that command before sending the final, complete prompt to the model.
 ---
 #### Example: A "Pure Function" Refactoring Command
@ -214,7 +255,7 @@ First, ensure the user commands directory exists, then create a `refactor` subdi
 ```bash
 mkdir -p ~/.gemini/commands/refactor
 touch ~/.gemini/commands/refactor/pure.toml
-```
+````
 **2. Add the content to the file:**
--- a/packages/cli/src/services/FileCommandLoader.test.ts
+++ b/packages/cli/src/services/FileCommandLoader.test.ts
@ -11,12 +11,68 @@ import {
  getUserCommandsDir,
 } from '@google/gemini-cli-core';
 import mock from 'mock-fs';
-import { assert } from 'vitest';
+import { assert, vi } from 'vitest';
 import { createMockCommandContext } from '../test-utils/mockCommandContext.js';
 import {
  SHELL_INJECTION_TRIGGER,
  SHORTHAND_ARGS_PLACEHOLDER,
 } from './prompt-processors/types.js';
 import {
  ConfirmationRequiredError,
  ShellProcessor,
 } from './prompt-processors/shellProcessor.js';
 import { ShorthandArgumentProcessor } from './prompt-processors/argumentProcessor.js';
 const mockShellProcess = vi.hoisted(() => vi.fn());
 vi.mock('./prompt-processors/shellProcessor.js', () => ({
  ShellProcessor: vi.fn().mockImplementation(() => ({
    process: mockShellProcess,
  })),
  ConfirmationRequiredError: class extends Error {
    constructor(
      message: string,
      public commandsToConfirm: string[],
    ) {
      super(message);
      this.name = 'ConfirmationRequiredError';
    }
  },
 }));
 vi.mock('./prompt-processors/argumentProcessor.js', async (importOriginal) => {
  const original =
    await importOriginal<
      typeof import('./prompt-processors/argumentProcessor.js')
    >();
  return {
    ShorthandArgumentProcessor: vi
      .fn()
      .mockImplementation(() => new original.ShorthandArgumentProcessor()),
    DefaultArgumentProcessor: vi
      .fn()
      .mockImplementation(() => new original.DefaultArgumentProcessor()),
  };
 });
 vi.mock('@google/gemini-cli-core', async (importOriginal) => {
  const original =
    await importOriginal<typeof import('@google/gemini-cli-core')>();
  return {
    ...original,
    isCommandAllowed: vi.fn(),
    ShellExecutionService: {
      execute: vi.fn(),
    },
  };
 });
 describe('FileCommandLoader', () => {
  const signal: AbortSignal = new AbortController().signal;
  beforeEach(() => {
    vi.clearAllMocks();
    mockShellProcess.mockImplementation((prompt) => Promise.resolve(prompt));
  });
  afterEach(() => {
    mock.restore();
  });
@ -371,4 +427,180 @@ describe('FileCommandLoader', () => {
      }
    });
  });
  describe('Shell Processor Integration', () => {
    it('instantiates ShellProcessor if the trigger is present', async () => {
      const userCommandsDir = getUserCommandsDir();
      mock({
        [userCommandsDir]: {
          'shell.toml': `prompt = "Run this: ${SHELL_INJECTION_TRIGGER}echo hello}"`,
        },
      });
      const loader = new FileCommandLoader(null as unknown as Config);
      await loader.loadCommands(signal);
      expect(ShellProcessor).toHaveBeenCalledWith('shell');
    });
    it('does not instantiate ShellProcessor if trigger is missing', async () => {
      const userCommandsDir = getUserCommandsDir();
      mock({
        [userCommandsDir]: {
          'regular.toml': `prompt = "Just a regular prompt"`,
        },
      });
      const loader = new FileCommandLoader(null as unknown as Config);
      await loader.loadCommands(signal);
      expect(ShellProcessor).not.toHaveBeenCalled();
    });
    it('returns a "submit_prompt" action if shell processing succeeds', async () => {
      const userCommandsDir = getUserCommandsDir();
      mock({
        [userCommandsDir]: {
          'shell.toml': `prompt = "Run !{echo 'hello'}"`,
        },
      });
      mockShellProcess.mockResolvedValue('Run hello');
      const loader = new FileCommandLoader(null as unknown as Config);
      const commands = await loader.loadCommands(signal);
      const command = commands.find((c) => c.name === 'shell');
      expect(command).toBeDefined();
      const result = await command!.action!(
        createMockCommandContext({
          invocation: { raw: '/shell', name: 'shell', args: '' },
        }),
        '',
      );
      expect(result?.type).toBe('submit_prompt');
      if (result?.type === 'submit_prompt') {
        expect(result.content).toBe('Run hello');
      }
    });
    it('returns a "confirm_shell_commands" action if shell processing requires it', async () => {
      const userCommandsDir = getUserCommandsDir();
      const rawInvocation = '/shell rm -rf /';
      mock({
        [userCommandsDir]: {
          'shell.toml': `prompt = "Run !{rm -rf /}"`,
        },
      });
      // Mock the processor to throw the specific error
      const error = new ConfirmationRequiredError('Confirmation needed', [
        'rm -rf /',
      ]);
      mockShellProcess.mockRejectedValue(error);
      const loader = new FileCommandLoader(null as unknown as Config);
      const commands = await loader.loadCommands(signal);
      const command = commands.find((c) => c.name === 'shell');
      expect(command).toBeDefined();
      const result = await command!.action!(
        createMockCommandContext({
          invocation: { raw: rawInvocation, name: 'shell', args: 'rm -rf /' },
        }),
        'rm -rf /',
      );
      expect(result?.type).toBe('confirm_shell_commands');
      if (result?.type === 'confirm_shell_commands') {
        expect(result.commandsToConfirm).toEqual(['rm -rf /']);
        expect(result.originalInvocation.raw).toBe(rawInvocation);
      }
    });
    it('re-throws other errors from the processor', async () => {
      const userCommandsDir = getUserCommandsDir();
      mock({
        [userCommandsDir]: {
          'shell.toml': `prompt = "Run !{something}"`,
        },
      });
      const genericError = new Error('Something else went wrong');
      mockShellProcess.mockRejectedValue(genericError);
      const loader = new FileCommandLoader(null as unknown as Config);
      const commands = await loader.loadCommands(signal);
      const command = commands.find((c) => c.name === 'shell');
      expect(command).toBeDefined();
      await expect(
        command!.action!(
          createMockCommandContext({
            invocation: { raw: '/shell', name: 'shell', args: '' },
          }),
          '',
        ),
      ).rejects.toThrow('Something else went wrong');
    });
    it('assembles the processor pipeline in the correct order (Shell -> Argument)', async () => {
      const userCommandsDir = getUserCommandsDir();
      mock({
        [userCommandsDir]: {
          'pipeline.toml': `
            prompt = "Shell says: ${SHELL_INJECTION_TRIGGER}echo foo} and user says: ${SHORTHAND_ARGS_PLACEHOLDER}"
          `,
        },
      });
      // Mock the process methods to track call order
      const argProcessMock = vi
        .fn()
        .mockImplementation((p) => `${p}-arg-processed`);
      // Redefine the mock for this specific test
      mockShellProcess.mockImplementation((p) =>
        Promise.resolve(`${p}-shell-processed`),
      );
      vi.mocked(ShorthandArgumentProcessor).mockImplementation(
        () =>
          ({
            process: argProcessMock,
          }) as unknown as ShorthandArgumentProcessor,
      );
      const loader = new FileCommandLoader(null as unknown as Config);
      const commands = await loader.loadCommands(signal);
      const command = commands.find((c) => c.name === 'pipeline');
      expect(command).toBeDefined();
      await command!.action!(
        createMockCommandContext({
          invocation: {
            raw: '/pipeline bar',
            name: 'pipeline',
            args: 'bar',
          },
        }),
        'bar',
      );
      // Verify that the shell processor was called before the argument processor
      expect(mockShellProcess.mock.invocationCallOrder[0]).toBeLessThan(
        argProcessMock.mock.invocationCallOrder[0],
      );
      // Also verify the flow of the prompt through the processors
      expect(mockShellProcess).toHaveBeenCalledWith(
        expect.any(String),
        expect.any(Object),
      );
      expect(argProcessMock).toHaveBeenCalledWith(
        expect.stringContaining('-shell-processed'), // It receives the output of the shell processor
        expect.any(Object),
      );
    });
  });
 });
--- a/packages/cli/src/services/FileCommandLoader.ts
+++ b/packages/cli/src/services/FileCommandLoader.ts
@ -19,7 +19,7 @@ import {
  CommandContext,
  CommandKind,
  SlashCommand,
-  SubmitPromptActionReturn,
+  SlashCommandActionReturn,
 } from '../ui/commands/types.js';
 import {
  DefaultArgumentProcessor,
@ -28,7 +28,12 @@ import {
 import {
  IPromptProcessor,
  SHORTHAND_ARGS_PLACEHOLDER,
  SHELL_INJECTION_TRIGGER,
 } from './prompt-processors/types.js';
 import {
  ConfirmationRequiredError,
  ShellProcessor,
 } from './prompt-processors/shellProcessor.js';
 /**
 * Defines the Zod schema for a command definition file. This serves as the
@ -172,6 +177,11 @@ export class FileCommandLoader implements ICommandLoader {
    const processors: IPromptProcessor[] = [];
    // Add the Shell Processor if needed.
    if (validDef.prompt.includes(SHELL_INJECTION_TRIGGER)) {
      processors.push(new ShellProcessor(commandName));
    }
    // The presence of '{{args}}' is the switch that determines the behavior.
    if (validDef.prompt.includes(SHORTHAND_ARGS_PLACEHOLDER)) {
      processors.push(new ShorthandArgumentProcessor());
@ -188,7 +198,7 @@ export class FileCommandLoader implements ICommandLoader {
      action: async (
        context: CommandContext,
        _args: string,
-      ): Promise<SubmitPromptActionReturn> => {
+      ): Promise<SlashCommandActionReturn> => {
        if (!context.invocation) {
          console.error(
            `[FileCommandLoader] Critical error: Command '${commandName}' was executed without invocation context.`,
@ -199,15 +209,31 @@ export class FileCommandLoader implements ICommandLoader {
          };
        }
-        let processedPrompt = validDef.prompt;
+        try {
-        for (const processor of processors) {
+          let processedPrompt = validDef.prompt;
-          processedPrompt = await processor.process(processedPrompt, context);
+          for (const processor of processors) {
-        }
+            processedPrompt = await processor.process(processedPrompt, context);
          }
-        return {
+          return {
-          type: 'submit_prompt',
+            type: 'submit_prompt',
-          content: processedPrompt,
+            content: processedPrompt,
-        };
+          };
        } catch (e) {
          // Check if it's our specific error type
          if (e instanceof ConfirmationRequiredError) {
            // Halt and request confirmation from the UI layer.
            return {
              type: 'confirm_shell_commands',
              commandsToConfirm: e.commandsToConfirm,
              originalInvocation: {
                raw: context.invocation.raw,
              },
            };
          }
          // Re-throw other errors to be handled by the global error handler.
          throw e;
        }
      },
    };
  }
--- a/packages/cli/src/services/prompt-processors/shellProcessor.test.ts
+++ b/packages/cli/src/services/prompt-processors/shellProcessor.test.ts
@ -0,0 +1,300 @@
 /**
 * @license
 * Copyright 2025 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */
 import { vi, describe, it, expect, beforeEach } from 'vitest';
 import { ConfirmationRequiredError, ShellProcessor } from './shellProcessor.js';
 import { createMockCommandContext } from '../../test-utils/mockCommandContext.js';
 import { CommandContext } from '../../ui/commands/types.js';
 import { Config } from '@google/gemini-cli-core';
 const mockCheckCommandPermissions = vi.hoisted(() => vi.fn());
 const mockShellExecute = vi.hoisted(() => vi.fn());
 vi.mock('@google/gemini-cli-core', async (importOriginal) => {
  const original = await importOriginal<object>();
  return {
    ...original,
    checkCommandPermissions: mockCheckCommandPermissions,
    ShellExecutionService: {
      execute: mockShellExecute,
    },
  };
 });
 describe('ShellProcessor', () => {
  let context: CommandContext;
  let mockConfig: Partial<Config>;
  beforeEach(() => {
    vi.clearAllMocks();
    mockConfig = {
      getTargetDir: vi.fn().mockReturnValue('/test/dir'),
    };
    context = createMockCommandContext({
      services: {
        config: mockConfig as Config,
      },
      session: {
        sessionShellAllowlist: new Set(),
      },
    });
    mockShellExecute.mockReturnValue({
      result: Promise.resolve({
        output: 'default shell output',
      }),
    });
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: true,
      disallowedCommands: [],
    });
  });
  it('should not change the prompt if no shell injections are present', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'This is a simple prompt with no injections.';
    const result = await processor.process(prompt, context);
    expect(result).toBe(prompt);
    expect(mockShellExecute).not.toHaveBeenCalled();
  });
  it('should process a single valid shell injection if allowed', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'The current status is: !{git status}';
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: true,
      disallowedCommands: [],
    });
    mockShellExecute.mockReturnValue({
      result: Promise.resolve({ output: 'On branch main' }),
    });
    const result = await processor.process(prompt, context);
    expect(mockCheckCommandPermissions).toHaveBeenCalledWith(
      'git status',
      expect.any(Object),
      context.session.sessionShellAllowlist,
    );
    expect(mockShellExecute).toHaveBeenCalledWith(
      'git status',
      expect.any(String),
      expect.any(Function),
      expect.any(Object),
    );
    expect(result).toBe('The current status is: On branch main');
  });
  it('should process multiple valid shell injections if all are allowed', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = '!{git status} in !{pwd}';
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: true,
      disallowedCommands: [],
    });
    mockShellExecute
      .mockReturnValueOnce({
        result: Promise.resolve({ output: 'On branch main' }),
      })
      .mockReturnValueOnce({
        result: Promise.resolve({ output: '/usr/home' }),
      });
    const result = await processor.process(prompt, context);
    expect(mockCheckCommandPermissions).toHaveBeenCalledTimes(2);
    expect(mockShellExecute).toHaveBeenCalledTimes(2);
    expect(result).toBe('On branch main in /usr/home');
  });
  it('should throw ConfirmationRequiredError if a command is not allowed', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'Do something dangerous: !{rm -rf /}';
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: false,
      disallowedCommands: ['rm -rf /'],
    });
    await expect(processor.process(prompt, context)).rejects.toThrow(
      ConfirmationRequiredError,
    );
  });
  it('should throw ConfirmationRequiredError with the correct command', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'Do something dangerous: !{rm -rf /}';
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: false,
      disallowedCommands: ['rm -rf /'],
    });
    try {
      await processor.process(prompt, context);
      // Fail if it doesn't throw
      expect(true).toBe(false);
    } catch (e) {
      expect(e).toBeInstanceOf(ConfirmationRequiredError);
      if (e instanceof ConfirmationRequiredError) {
        expect(e.commandsToConfirm).toEqual(['rm -rf /']);
      }
    }
    expect(mockShellExecute).not.toHaveBeenCalled();
  });
  it('should throw ConfirmationRequiredError with multiple commands if multiple are disallowed', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = '!{cmd1} and !{cmd2}';
    mockCheckCommandPermissions.mockImplementation((cmd) => {
      if (cmd === 'cmd1') {
        return { allAllowed: false, disallowedCommands: ['cmd1'] };
      }
      if (cmd === 'cmd2') {
        return { allAllowed: false, disallowedCommands: ['cmd2'] };
      }
      return { allAllowed: true, disallowedCommands: [] };
    });
    try {
      await processor.process(prompt, context);
      // Fail if it doesn't throw
      expect(true).toBe(false);
    } catch (e) {
      expect(e).toBeInstanceOf(ConfirmationRequiredError);
      if (e instanceof ConfirmationRequiredError) {
        expect(e.commandsToConfirm).toEqual(['cmd1', 'cmd2']);
      }
    }
  });
  it('should not execute any commands if at least one requires confirmation', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'First: !{echo "hello"}, Second: !{rm -rf /}';
    mockCheckCommandPermissions.mockImplementation((cmd) => {
      if (cmd.includes('rm')) {
        return { allAllowed: false, disallowedCommands: [cmd] };
      }
      return { allAllowed: true, disallowedCommands: [] };
    });
    await expect(processor.process(prompt, context)).rejects.toThrow(
      ConfirmationRequiredError,
    );
    // Ensure no commands were executed because the pipeline was halted.
    expect(mockShellExecute).not.toHaveBeenCalled();
  });
  it('should only request confirmation for disallowed commands in a mixed prompt', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'Allowed: !{ls -l}, Disallowed: !{rm -rf /}';
    mockCheckCommandPermissions.mockImplementation((cmd) => ({
      allAllowed: !cmd.includes('rm'),
      disallowedCommands: cmd.includes('rm') ? [cmd] : [],
    }));
    try {
      await processor.process(prompt, context);
      expect.fail('Should have thrown ConfirmationRequiredError');
    } catch (e) {
      expect(e).toBeInstanceOf(ConfirmationRequiredError);
      if (e instanceof ConfirmationRequiredError) {
        expect(e.commandsToConfirm).toEqual(['rm -rf /']);
      }
    }
  });
  it('should execute all commands if they are on the session allowlist', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'Run !{cmd1} and !{cmd2}';
    // Add commands to the session allowlist
    context.session.sessionShellAllowlist = new Set(['cmd1', 'cmd2']);
    // checkCommandPermissions should now pass for these
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: true,
      disallowedCommands: [],
    });
    mockShellExecute
      .mockReturnValueOnce({ result: Promise.resolve({ output: 'output1' }) })
      .mockReturnValueOnce({ result: Promise.resolve({ output: 'output2' }) });
    const result = await processor.process(prompt, context);
    expect(mockCheckCommandPermissions).toHaveBeenCalledWith(
      'cmd1',
      expect.any(Object),
      context.session.sessionShellAllowlist,
    );
    expect(mockCheckCommandPermissions).toHaveBeenCalledWith(
      'cmd2',
      expect.any(Object),
      context.session.sessionShellAllowlist,
    );
    expect(mockShellExecute).toHaveBeenCalledTimes(2);
    expect(result).toBe('Run output1 and output2');
  });
  it('should trim whitespace from the command inside the injection', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'Files: !{  ls -l  }';
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: true,
      disallowedCommands: [],
    });
    mockShellExecute.mockReturnValue({
      result: Promise.resolve({ output: 'total 0' }),
    });
    await processor.process(prompt, context);
    expect(mockCheckCommandPermissions).toHaveBeenCalledWith(
      'ls -l', // Verifies that the command was trimmed
      expect.any(Object),
      context.session.sessionShellAllowlist,
    );
    expect(mockShellExecute).toHaveBeenCalledWith(
      'ls -l',
      expect.any(String),
      expect.any(Function),
      expect.any(Object),
    );
  });
  it('should handle an empty command inside the injection gracefully', async () => {
    const processor = new ShellProcessor('test-command');
    const prompt = 'This is weird: !{}';
    mockCheckCommandPermissions.mockReturnValue({
      allAllowed: true,
      disallowedCommands: [],
    });
    mockShellExecute.mockReturnValue({
      result: Promise.resolve({ output: 'empty output' }),
    });
    const result = await processor.process(prompt, context);
    expect(mockCheckCommandPermissions).toHaveBeenCalledWith(
      '',
      expect.any(Object),
      context.session.sessionShellAllowlist,
    );
    expect(mockShellExecute).toHaveBeenCalledWith(
      '',
      expect.any(String),
      expect.any(Function),
      expect.any(Object),
    );
    expect(result).toBe('This is weird: empty output');
  });
 });
--- a/packages/cli/src/services/prompt-processors/shellProcessor.ts
+++ b/packages/cli/src/services/prompt-processors/shellProcessor.ts
@ -0,0 +1,106 @@
 /**
 * @license
 * Copyright 2025 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */
 import {
  checkCommandPermissions,
  ShellExecutionService,
 } from '@google/gemini-cli-core';
 import { CommandContext } from '../../ui/commands/types.js';
 import { IPromptProcessor } from './types.js';
 export class ConfirmationRequiredError extends Error {
  constructor(
    message: string,
    public commandsToConfirm: string[],
  ) {
    super(message);
    this.name = 'ConfirmationRequiredError';
  }
 }
 /**
 * Finds all instances of shell command injections (`!{...}`) in a prompt,
 * executes them, and replaces the injection site with the command's output.
 *
 * This processor ensures that only allowlisted commands are executed. If a
 * disallowed command is found, it halts execution and reports an error.
 */
 export class ShellProcessor implements IPromptProcessor {
  /**
   * A regular expression to find all instances of `!{...}`. The inner
   * capture group extracts the command itself.
   */
  private static readonly SHELL_INJECTION_REGEX = /!\{([^}]*)\}/g;
  /**
   * @param commandName The name of the custom command being executed, used
   *   for logging and error messages.
   */
  constructor(private readonly commandName: string) {}
  async process(prompt: string, context: CommandContext): Promise<string> {
    const { config, sessionShellAllowlist } = {
      ...context.services,
      ...context.session,
    };
    const commandsToExecute: Array<{ fullMatch: string; command: string }> = [];
    const commandsToConfirm = new Set<string>();
    const matches = [...prompt.matchAll(ShellProcessor.SHELL_INJECTION_REGEX)];
    if (matches.length === 0) {
      return prompt; // No shell commands, nothing to do.
    }
    // Discover all commands and check permissions.
    for (const match of matches) {
      const command = match[1].trim();
      const { allAllowed, disallowedCommands, blockReason, isHardDenial } =
        checkCommandPermissions(command, config!, sessionShellAllowlist);
      if (!allAllowed) {
        // If it's a hard denial, this is a non-recoverable security error.
        if (isHardDenial) {
          throw new Error(
            `${this.commandName} cannot be run. ${blockReason || 'A shell command in this custom command is explicitly blocked in your config settings.'}`,
          );
        }
        // Add each soft denial disallowed command to the set for confirmation.
        disallowedCommands.forEach((uc) => commandsToConfirm.add(uc));
      }
      commandsToExecute.push({ fullMatch: match[0], command });
    }
    // If any commands require confirmation, throw a special error to halt the
    // pipeline and trigger the UI flow.
    if (commandsToConfirm.size > 0) {
      throw new ConfirmationRequiredError(
        'Shell command confirmation required',
        Array.from(commandsToConfirm),
      );
    }
    // Execute all commands (only runs if no confirmation was needed).
    let processedPrompt = prompt;
    for (const { fullMatch, command } of commandsToExecute) {
      const { result } = ShellExecutionService.execute(
        command,
        config!.getTargetDir(),
        () => {}, // No streaming needed.
        new AbortController().signal, // For now, we don't support cancellation from here.
      );
      const executionResult = await result;
      processedPrompt = processedPrompt.replace(
        fullMatch,
        executionResult.output,
      );
    }
    return processedPrompt;
  }
 }
--- a/packages/cli/src/services/prompt-processors/types.ts
+++ b/packages/cli/src/services/prompt-processors/types.ts
@ -35,3 +35,8 @@ export interface IPromptProcessor {
 * The placeholder string for shorthand argument injection in custom commands.
 */
 export const SHORTHAND_ARGS_PLACEHOLDER = '{{args}}';
 /**
 * The trigger string for shell command injection in custom commands.
 */
 export const SHELL_INJECTION_TRIGGER = '!{';
--- a/packages/cli/src/ui/App.tsx
+++ b/packages/cli/src/ui/App.tsx
@ -36,6 +36,7 @@ import { ThemeDialog } from './components/ThemeDialog.js';
 import { AuthDialog } from './components/AuthDialog.js';
 import { AuthInProgress } from './components/AuthInProgress.js';
 import { EditorSettingsDialog } from './components/EditorSettingsDialog.js';
 import { ShellConfirmationDialog } from './components/ShellConfirmationDialog.js';
 import { Colors } from './colors.js';
 import { Help } from './components/Help.js';
 import { loadHierarchicalGeminiMemory } from '../config/config.js';
@ -169,6 +170,7 @@ const App = ({ config, settings, startupWarnings = [], version }: AppProps) => {
    useState<boolean>(false);
  const [userTier, setUserTier] = useState<UserTierId | undefined>(undefined);
  const [openFiles, setOpenFiles] = useState<OpenFiles | undefined>();
  const [isProcessing, setIsProcessing] = useState<boolean>(false);
  useEffect(() => {
    const unsubscribe = ideContext.subscribeToOpenFiles(setOpenFiles);
@ -452,6 +454,7 @@ const App = ({ config, settings, startupWarnings = [], version }: AppProps) => {
    slashCommands,
    pendingHistoryItems: pendingSlashCommandHistoryItems,
    commandContext,
    shellConfirmationRequest,
  } = useSlashCommandProcessor(
    config,
    settings,
@ -468,6 +471,7 @@ const App = ({ config, settings, startupWarnings = [], version }: AppProps) => {
    setQuittingMessages,
    openPrivacyNotice,
    toggleVimEnabled,
    setIsProcessing,
  );
  const {
@ -624,7 +628,8 @@ const App = ({ config, settings, startupWarnings = [], version }: AppProps) => {
    fetchUserMessages();
  }, [history, logger]);
-  const isInputActive = streamingState === StreamingState.Idle && !initError;
+  const isInputActive =
    streamingState === StreamingState.Idle && !initError && !isProcessing;
  const handleClearScreen = useCallback(() => {
    clearItems();
@ -830,7 +835,9 @@ const App = ({ config, settings, startupWarnings = [], version }: AppProps) => {
            </Box>
          )}
-          {isThemeDialogOpen ? (
+          {shellConfirmationRequest ? (
            <ShellConfirmationDialog request={shellConfirmationRequest} />
          ) : isThemeDialogOpen ? (
            <Box flexDirection="column">
              {themeError && (
                <Box marginBottom={1}>
--- a/packages/cli/src/ui/commands/types.ts
+++ b/packages/cli/src/ui/commands/types.ts
@ -63,6 +63,8 @@ export interface CommandContext {
  // Session-specific data
  session: {
    stats: SessionStatsState;
    /** A transient list of shell commands the user has approved for this session. */
    sessionShellAllowlist: Set<string>;
  };
 }
@ -118,13 +120,28 @@ export interface SubmitPromptActionReturn {
  content: string;
 }
 /**
 * The return type for a command action that needs to pause and request
 * confirmation for a set of shell commands before proceeding.
 */
 export interface ConfirmShellCommandsActionReturn {
  type: 'confirm_shell_commands';
  /** The list of shell commands that require user confirmation. */
  commandsToConfirm: string[];
  /** The original invocation context to be re-run after confirmation. */
  originalInvocation: {
    raw: string;
  };
 }
 export type SlashCommandActionReturn =
  | ToolActionReturn
  | MessageActionReturn
  | QuitActionReturn
  | OpenDialogActionReturn
  | LoadHistoryActionReturn
-  | SubmitPromptActionReturn;
+  | SubmitPromptActionReturn
  | ConfirmShellCommandsActionReturn;
 export enum CommandKind {
  BUILT_IN = 'built-in',
--- a/packages/cli/src/ui/components/ShellConfirmationDialog.test.tsx
+++ b/packages/cli/src/ui/components/ShellConfirmationDialog.test.tsx
@ -0,0 +1,45 @@
 /**
 * @license
 * Copyright 2025 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */
 import { render } from 'ink-testing-library';
 import { describe, it, expect, vi } from 'vitest';
 import { ShellConfirmationDialog } from './ShellConfirmationDialog.js';
 describe('ShellConfirmationDialog', () => {
  const onConfirm = vi.fn();
  const request = {
    commands: ['ls -la', 'echo "hello"'],
    onConfirm,
  };
  it('renders correctly', () => {
    const { lastFrame } = render(<ShellConfirmationDialog request={request} />);
    expect(lastFrame()).toMatchSnapshot();
  });
  it('calls onConfirm with ProceedOnce when "Yes, allow once" is selected', () => {
    const { lastFrame } = render(<ShellConfirmationDialog request={request} />);
    const select = lastFrame()!.toString();
    // Simulate selecting the first option
    // This is a simplified way to test the selection
    expect(select).toContain('Yes, allow once');
  });
  it('calls onConfirm with ProceedAlways when "Yes, allow always for this session" is selected', () => {
    const { lastFrame } = render(<ShellConfirmationDialog request={request} />);
    const select = lastFrame()!.toString();
    // Simulate selecting the second option
    expect(select).toContain('Yes, allow always for this session');
  });
  it('calls onConfirm with Cancel when "No (esc)" is selected', () => {
    const { lastFrame } = render(<ShellConfirmationDialog request={request} />);
    const select = lastFrame()!.toString();
    // Simulate selecting the third option
    expect(select).toContain('No (esc)');
  });
 });
--- a/packages/cli/src/ui/components/ShellConfirmationDialog.tsx
+++ b/packages/cli/src/ui/components/ShellConfirmationDialog.tsx
@ -0,0 +1,98 @@
 /**
 * @license
 * Copyright 2025 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */
 import { ToolConfirmationOutcome } from '@google/gemini-cli-core';
 import { Box, Text, useInput } from 'ink';
 import React from 'react';
 import { Colors } from '../colors.js';
 import {
  RadioButtonSelect,
  RadioSelectItem,
 } from './shared/RadioButtonSelect.js';
 export interface ShellConfirmationRequest {
  commands: string[];
  onConfirm: (
    outcome: ToolConfirmationOutcome,
    approvedCommands?: string[],
  ) => void;
 }
 export interface ShellConfirmationDialogProps {
  request: ShellConfirmationRequest;
 }
 export const ShellConfirmationDialog: React.FC<
  ShellConfirmationDialogProps
 > = ({ request }) => {
  const { commands, onConfirm } = request;
  useInput((_, key) => {
    if (key.escape) {
      onConfirm(ToolConfirmationOutcome.Cancel);
    }
  });
  const handleSelect = (item: ToolConfirmationOutcome) => {
    if (item === ToolConfirmationOutcome.Cancel) {
      onConfirm(item);
    } else {
      // For both ProceedOnce and ProceedAlways, we approve all the
      // commands that were requested.
      onConfirm(item, commands);
    }
  };
  const options: Array<RadioSelectItem<ToolConfirmationOutcome>> = [
    {
      label: 'Yes, allow once',
      value: ToolConfirmationOutcome.ProceedOnce,
    },
    {
      label: 'Yes, allow always for this session',
      value: ToolConfirmationOutcome.ProceedAlways,
    },
    {
      label: 'No (esc)',
      value: ToolConfirmationOutcome.Cancel,
    },
  ];
  return (
    <Box
      flexDirection="column"
      borderStyle="round"
      borderColor={Colors.AccentYellow}
      padding={1}
      width="100%"
      marginLeft={1}
    >
      <Box flexDirection="column" marginBottom={1}>
        <Text bold>Shell Command Execution</Text>
        <Text>A custom command wants to run the following shell commands:</Text>
        <Box
          flexDirection="column"
          borderStyle="round"
          borderColor={Colors.Gray}
          paddingX={1}
          marginTop={1}
        >
          {commands.map((cmd) => (
            <Text key={cmd} color={Colors.AccentCyan}>
              {cmd}
            </Text>
          ))}
        </Box>
      </Box>
      <Box marginBottom={1}>
        <Text>Do you want to proceed?</Text>
      </Box>
      <RadioButtonSelect items={options} onSelect={handleSelect} isFocused />
    </Box>
  );
 };
--- a/packages/cli/src/ui/components/snapshots/ShellConfirmationDialog.test.tsx.snap
+++ b/packages/cli/src/ui/components/snapshots/ShellConfirmationDialog.test.tsx.snap
@ -0,0 +1,21 @@
 // Vitest Snapshot v1, https://vitest.dev/guide/snapshot.html
 exports[`ShellConfirmationDialog > renders correctly 1`] = `
 " ╭──────────────────────────────────────────────────────────────────────────────────────────────────╮
 │                                                                                                  │
 │ Shell Command Execution                                                                          │
 │ A custom command wants to run the following shell commands:                                      │
 │                                                                                                  │
 │ ╭──────────────────────────────────────────────────────────────────────────────────────────────╮ │
 │ │ ls -la                                                                                       │ │
 │ │ echo "hello"                                                                                 │ │
 │ ╰──────────────────────────────────────────────────────────────────────────────────────────────╯ │
 │                                                                                                  │
 │ Do you want to proceed?                                                                          │
 │                                                                                                  │
 │ ● 1. Yes, allow once                                                                             │
 │   2. Yes, allow always for this session                                                          │
 │   3. No (esc)                                                                                    │
 │                                                                                                  │
 ╰──────────────────────────────────────────────────────────────────────────────────────────────────╯"
 `;
--- a/packages/cli/src/ui/hooks/slashCommandProcessor.test.ts
+++ b/packages/cli/src/ui/hooks/slashCommandProcessor.test.ts
@ -42,8 +42,13 @@ vi.mock('../contexts/SessionContext.js', () => ({
 import { act, renderHook, waitFor } from '@testing-library/react';
 import { vi, describe, it, expect, beforeEach, type Mock } from 'vitest';
 import { useSlashCommandProcessor } from './slashCommandProcessor.js';
-import { CommandKind, SlashCommand } from '../commands/types.js';
+import {
-import { Config } from '@google/gemini-cli-core';
+  CommandContext,
  CommandKind,
  ConfirmShellCommandsActionReturn,
  SlashCommand,
 } from '../commands/types.js';
 import { Config, ToolConfirmationOutcome } from '@google/gemini-cli-core';
 import { LoadedSettings } from '../../config/settings.js';
 import { MessageType } from '../types.js';
 import { BuiltinCommandLoader } from '../../services/BuiltinCommandLoader.js';
@ -90,6 +95,7 @@ describe('useSlashCommandProcessor', () => {
    builtinCommands: SlashCommand[] = [],
    fileCommands: SlashCommand[] = [],
    mcpCommands: SlashCommand[] = [],
    setIsProcessing = vi.fn(),
  ) => {
    mockBuiltinLoadCommands.mockResolvedValue(Object.freeze(builtinCommands));
    mockFileLoadCommands.mockResolvedValue(Object.freeze(fileCommands));
@ -112,6 +118,7 @@ describe('useSlashCommandProcessor', () => {
        mockSetQuittingMessages,
        vi.fn(), // openPrivacyNotice
        vi.fn(), // toggleVimEnabled
        setIsProcessing,
      ),
    );
@ -275,6 +282,32 @@ describe('useSlashCommandProcessor', () => {
        'with args',
      );
    });
    it('should set isProcessing to true during execution and false afterwards', async () => {
      const mockSetIsProcessing = vi.fn();
      const command = createTestCommand({
        name: 'long-running',
        action: () => new Promise((resolve) => setTimeout(resolve, 50)),
      });
      const result = setupProcessorHook([command], [], [], mockSetIsProcessing);
      await waitFor(() => expect(result.current.slashCommands).toHaveLength(1));
      const executionPromise = act(async () => {
        await result.current.handleSlashCommand('/long-running');
      });
      // It should be true immediately after starting
      expect(mockSetIsProcessing).toHaveBeenCalledWith(true);
      // It should not have been called with false yet
      expect(mockSetIsProcessing).not.toHaveBeenCalledWith(false);
      await executionPromise;
      // After the promise resolves, it should be called with false
      expect(mockSetIsProcessing).toHaveBeenCalledWith(false);
      expect(mockSetIsProcessing).toHaveBeenCalledTimes(2);
    });
  });
  describe('Action Result Handling', () => {
@ -417,6 +450,176 @@ describe('useSlashCommandProcessor', () => {
    });
  });
  describe('Shell Command Confirmation Flow', () => {
    // Use a generic vi.fn() for the action. We will change its behavior in each test.
    const mockCommandAction = vi.fn();
    const shellCommand = createTestCommand({
      name: 'shellcmd',
      action: mockCommandAction,
    });
    beforeEach(() => {
      // Reset the mock before each test
      mockCommandAction.mockClear();
      // Default behavior: request confirmation
      mockCommandAction.mockResolvedValue({
        type: 'confirm_shell_commands',
        commandsToConfirm: ['rm -rf /'],
        originalInvocation: { raw: '/shellcmd' },
      } as ConfirmShellCommandsActionReturn);
    });
    it('should set confirmation request when action returns confirm_shell_commands', async () => {
      const result = setupProcessorHook([shellCommand]);
      await waitFor(() => expect(result.current.slashCommands).toHaveLength(1));
      // This is intentionally not awaited, because the promise it returns
      // will not resolve until the user responds to the confirmation.
      act(() => {
        result.current.handleSlashCommand('/shellcmd');
      });
      // We now wait for the state to be updated with the request.
      await waitFor(() => {
        expect(result.current.shellConfirmationRequest).not.toBeNull();
      });
      expect(result.current.shellConfirmationRequest?.commands).toEqual([
        'rm -rf /',
      ]);
    });
    it('should do nothing if user cancels confirmation', async () => {
      const result = setupProcessorHook([shellCommand]);
      await waitFor(() => expect(result.current.slashCommands).toHaveLength(1));
      act(() => {
        result.current.handleSlashCommand('/shellcmd');
      });
      // Wait for the confirmation dialog to be set
      await waitFor(() => {
        expect(result.current.shellConfirmationRequest).not.toBeNull();
      });
      const onConfirm = result.current.shellConfirmationRequest?.onConfirm;
      expect(onConfirm).toBeDefined();
      // Change the mock action's behavior for a potential second run.
      // If the test is flawed, this will be called, and we can detect it.
      mockCommandAction.mockResolvedValue({
        type: 'message',
        messageType: 'info',
        content: 'This should not be called',
      });
      await act(async () => {
        onConfirm!(ToolConfirmationOutcome.Cancel, []); // Pass empty array for safety
      });
      expect(result.current.shellConfirmationRequest).toBeNull();
      // Verify the action was only called the initial time.
      expect(mockCommandAction).toHaveBeenCalledTimes(1);
    });
    it('should re-run command with one-time allowlist on "Proceed Once"', async () => {
      const result = setupProcessorHook([shellCommand]);
      await waitFor(() => expect(result.current.slashCommands).toHaveLength(1));
      act(() => {
        result.current.handleSlashCommand('/shellcmd');
      });
      await waitFor(() => {
        expect(result.current.shellConfirmationRequest).not.toBeNull();
      });
      const onConfirm = result.current.shellConfirmationRequest?.onConfirm;
      // **Change the mock's behavior for the SECOND run.**
      // This is the key to testing the outcome.
      mockCommandAction.mockResolvedValue({
        type: 'message',
        messageType: 'info',
        content: 'Success!',
      });
      await act(async () => {
        onConfirm!(ToolConfirmationOutcome.ProceedOnce, ['rm -rf /']);
      });
      expect(result.current.shellConfirmationRequest).toBeNull();
      // The action should have been called twice (initial + re-run).
      await waitFor(() => {
        expect(mockCommandAction).toHaveBeenCalledTimes(2);
      });
      // We can inspect the context of the second call to ensure the one-time list was used.
      const secondCallContext = mockCommandAction.mock
        .calls[1][0] as CommandContext;
      expect(
        secondCallContext.session.sessionShellAllowlist.has('rm -rf /'),
      ).toBe(true);
      // Verify the final success message was added.
      expect(mockAddItem).toHaveBeenCalledWith(
        { type: MessageType.INFO, text: 'Success!' },
        expect.any(Number),
      );
      // Verify the session-wide allowlist was NOT permanently updated.
      // Re-render the hook by calling a no-op command to get the latest context.
      await act(async () => {
        result.current.handleSlashCommand('/no-op');
      });
      const finalContext = result.current.commandContext;
      expect(finalContext.session.sessionShellAllowlist.size).toBe(0);
    });
    it('should re-run command and update session allowlist on "Proceed Always"', async () => {
      const result = setupProcessorHook([shellCommand]);
      await waitFor(() => expect(result.current.slashCommands).toHaveLength(1));
      act(() => {
        result.current.handleSlashCommand('/shellcmd');
      });
      await waitFor(() => {
        expect(result.current.shellConfirmationRequest).not.toBeNull();
      });
      const onConfirm = result.current.shellConfirmationRequest?.onConfirm;
      mockCommandAction.mockResolvedValue({
        type: 'message',
        messageType: 'info',
        content: 'Success!',
      });
      await act(async () => {
        onConfirm!(ToolConfirmationOutcome.ProceedAlways, ['rm -rf /']);
      });
      expect(result.current.shellConfirmationRequest).toBeNull();
      await waitFor(() => {
        expect(mockCommandAction).toHaveBeenCalledTimes(2);
      });
      expect(mockAddItem).toHaveBeenCalledWith(
        { type: MessageType.INFO, text: 'Success!' },
        expect.any(Number),
      );
      // Check that the session-wide allowlist WAS updated.
      await waitFor(() => {
        const finalContext = result.current.commandContext;
        expect(finalContext.session.sessionShellAllowlist.has('rm -rf /')).toBe(
          true,
        );
      });
    });
  });
  describe('Command Parsing and Matching', () => {
    it('should be case-sensitive', async () => {
      const command = createTestCommand({ name: 'test' });
@ -583,7 +786,7 @@ describe('useSlashCommandProcessor', () => {
  });
  describe('Lifecycle', () => {
-    it('should abort command loading when the hook unmounts', async () => {
+    it('should abort command loading when the hook unmounts', () => {
      const abortSpy = vi.spyOn(AbortController.prototype, 'abort');
      const { unmount } = renderHook(() =>
        useSlashCommandProcessor(
@ -597,10 +800,11 @@ describe('useSlashCommandProcessor', () => {
          vi.fn(), // onDebugMessage
          vi.fn(), // openThemeDialog
          mockOpenAuthDialog,
-          vi.fn(), // openEditorDialog
+          vi.fn(), // openEditorDialog,
          vi.fn(), // toggleCorgiMode
          mockSetQuittingMessages,
          vi.fn(), // openPrivacyNotice
          vi.fn(), // toggleVimEnabled
        ),
      );
--- a/packages/cli/src/ui/hooks/slashCommandProcessor.ts
+++ b/packages/cli/src/ui/hooks/slashCommandProcessor.ts
@ -9,7 +9,12 @@ import { type PartListUnion } from '@google/genai';
 import process from 'node:process';
 import { UseHistoryManagerReturn } from './useHistoryManager.js';
 import { useStateAndRef } from './useStateAndRef.js';
-import { Config, GitService, Logger } from '@google/gemini-cli-core';
+import {
  Config,
  GitService,
  Logger,
  ToolConfirmationOutcome,
 } from '@google/gemini-cli-core';
 import { useSessionStats } from '../contexts/SessionContext.js';
 import {
  Message,
@ -44,9 +49,21 @@ export const useSlashCommandProcessor = (
  setQuittingMessages: (message: HistoryItem[]) => void,
  openPrivacyNotice: () => void,
  toggleVimEnabled: () => Promise<boolean>,
  setIsProcessing: (isProcessing: boolean) => void,
 ) => {
  const session = useSessionStats();
  const [commands, setCommands] = useState<readonly SlashCommand[]>([]);
  const [shellConfirmationRequest, setShellConfirmationRequest] =
    useState<null | {
      commands: string[];
      onConfirm: (
        outcome: ToolConfirmationOutcome,
        approvedCommands?: string[],
      ) => void;
    }>(null);
  const [sessionShellAllowlist, setSessionShellAllowlist] = useState(
    new Set<string>(),
  );
  const gitService = useMemo(() => {
    if (!config?.getProjectRoot()) {
      return;
@ -144,6 +161,7 @@ export const useSlashCommandProcessor = (
      },
      session: {
        stats: session.stats,
        sessionShellAllowlist,
      },
    }),
    [
@ -161,6 +179,7 @@ export const useSlashCommandProcessor = (
      setPendingCompressionItem,
      toggleCorgiMode,
      toggleVimEnabled,
      sessionShellAllowlist,
    ],
  );
@ -189,69 +208,87 @@ export const useSlashCommandProcessor = (
  const handleSlashCommand = useCallback(
    async (
      rawQuery: PartListUnion,
      oneTimeShellAllowlist?: Set<string>,
    ): Promise<SlashCommandProcessorResult | false> => {
-      if (typeof rawQuery !== 'string') {
+      setIsProcessing(true);
-        return false;
+      try {
-      }
+        if (typeof rawQuery !== 'string') {
-
+          return false;
      const trimmed = rawQuery.trim();
      if (!trimmed.startsWith('/') && !trimmed.startsWith('?')) {
        return false;
      }
      const userMessageTimestamp = Date.now();
      addItem({ type: MessageType.USER, text: trimmed }, userMessageTimestamp);
      const parts = trimmed.substring(1).trim().split(/\s+/);
      const commandPath = parts.filter((p) => p); // The parts of the command, e.g., ['memory', 'add']
      let currentCommands = commands;
      let commandToExecute: SlashCommand | undefined;
      let pathIndex = 0;
      for (const part of commandPath) {
        // TODO: For better performance and architectural clarity, this two-pass
        // search could be replaced. A more optimal approach would be to
        // pre-compute a single lookup map in `CommandService.ts` that resolves
        // all name and alias conflicts during the initial loading phase. The
        // processor would then perform a single, fast lookup on that map.
        // First pass: check for an exact match on the primary command name.
        let foundCommand = currentCommands.find((cmd) => cmd.name === part);
        // Second pass: if no primary name matches, check for an alias.
        if (!foundCommand) {
          foundCommand = currentCommands.find((cmd) =>
            cmd.altNames?.includes(part),
          );
        }
-        if (foundCommand) {
+        const trimmed = rawQuery.trim();
-          commandToExecute = foundCommand;
+        if (!trimmed.startsWith('/') && !trimmed.startsWith('?')) {
-          pathIndex++;
+          return false;
-          if (foundCommand.subCommands) {
+        }
-            currentCommands = foundCommand.subCommands;
+
        const userMessageTimestamp = Date.now();
        addItem(
          { type: MessageType.USER, text: trimmed },
          userMessageTimestamp,
        );
        const parts = trimmed.substring(1).trim().split(/\s+/);
        const commandPath = parts.filter((p) => p); // The parts of the command, e.g., ['memory', 'add']
        let currentCommands = commands;
        let commandToExecute: SlashCommand | undefined;
        let pathIndex = 0;
        for (const part of commandPath) {
          // TODO: For better performance and architectural clarity, this two-pass
          // search could be replaced. A more optimal approach would be to
          // pre-compute a single lookup map in `CommandService.ts` that resolves
          // all name and alias conflicts during the initial loading phase. The
          // processor would then perform a single, fast lookup on that map.
          // First pass: check for an exact match on the primary command name.
          let foundCommand = currentCommands.find((cmd) => cmd.name === part);
          // Second pass: if no primary name matches, check for an alias.
          if (!foundCommand) {
            foundCommand = currentCommands.find((cmd) =>
              cmd.altNames?.includes(part),
            );
          }
          if (foundCommand) {
            commandToExecute = foundCommand;
            pathIndex++;
            if (foundCommand.subCommands) {
              currentCommands = foundCommand.subCommands;
            } else {
              break;
            }
          } else {
            break;
          }
        } else {
          break;
        }
      }
-      if (commandToExecute) {
+        if (commandToExecute) {
-        const args = parts.slice(pathIndex).join(' ');
+          const args = parts.slice(pathIndex).join(' ');
          if (commandToExecute.action) {
            const fullCommandContext: CommandContext = {
              ...commandContext,
              invocation: {
                raw: trimmed,
                name: commandToExecute.name,
                args,
              },
            };
            // If a one-time list is provided for a "Proceed" action, temporarily
            // augment the session allowlist for this single execution.
            if (oneTimeShellAllowlist && oneTimeShellAllowlist.size > 0) {
              fullCommandContext.session = {
                ...fullCommandContext.session,
                sessionShellAllowlist: new Set([
                  ...fullCommandContext.session.sessionShellAllowlist,
                  ...oneTimeShellAllowlist,
                ]),
              };
            }
        if (commandToExecute.action) {
          const fullCommandContext: CommandContext = {
            ...commandContext,
            invocation: {
              raw: trimmed,
              name: commandToExecute.name,
              args,
            },
          };
          try {
            const result = await commandToExecute.action(
              fullCommandContext,
              args,
@ -323,6 +360,46 @@ export const useSlashCommandProcessor = (
                    type: 'submit_prompt',
                    content: result.content,
                  };
                case 'confirm_shell_commands': {
                  const { outcome, approvedCommands } = await new Promise<{
                    outcome: ToolConfirmationOutcome;
                    approvedCommands?: string[];
                  }>((resolve) => {
                    setShellConfirmationRequest({
                      commands: result.commandsToConfirm,
                      onConfirm: (
                        resolvedOutcome,
                        resolvedApprovedCommands,
                      ) => {
                        setShellConfirmationRequest(null); // Close the dialog
                        resolve({
                          outcome: resolvedOutcome,
                          approvedCommands: resolvedApprovedCommands,
                        });
                      },
                    });
                  });
                  if (
                    outcome === ToolConfirmationOutcome.Cancel ||
                    !approvedCommands ||
                    approvedCommands.length === 0
                  ) {
                    return { type: 'handled' };
                  }
                  if (outcome === ToolConfirmationOutcome.ProceedAlways) {
                    setSessionShellAllowlist(
                      (prev) => new Set([...prev, ...approvedCommands]),
                    );
                  }
                  return await handleSlashCommand(
                    result.originalInvocation.raw,
                    // Pass the approved commands as a one-time grant for this execution.
                    new Set(approvedCommands),
                  );
                }
                default: {
                  const unhandled: never = result;
                  throw new Error(
@ -331,37 +408,39 @@ export const useSlashCommandProcessor = (
                }
              }
            }
-          } catch (e) {
+
-            addItem(
+            return { type: 'handled' };
-              {
+          } else if (commandToExecute.subCommands) {
-                type: MessageType.ERROR,
+            const helpText = `Command '/${commandToExecute.name}' requires a subcommand. Available:\n${commandToExecute.subCommands
-                text: e instanceof Error ? e.message : String(e),
+              .map((sc) => `  - ${sc.name}: ${sc.description || ''}`)
-              },
+              .join('\n')}`;
-              Date.now(),
+            addMessage({
-            );
+              type: MessageType.INFO,
              content: helpText,
              timestamp: new Date(),
            });
            return { type: 'handled' };
          }
          return { type: 'handled' };
        } else if (commandToExecute.subCommands) {
          const helpText = `Command '/${commandToExecute.name}' requires a subcommand. Available:\n${commandToExecute.subCommands
            .map((sc) => `  - ${sc.name}: ${sc.description || ''}`)
            .join('\n')}`;
          addMessage({
            type: MessageType.INFO,
            content: helpText,
            timestamp: new Date(),
          });
          return { type: 'handled' };
        }
      }
-      addMessage({
+        addMessage({
-        type: MessageType.ERROR,
+          type: MessageType.ERROR,
-        content: `Unknown command: ${trimmed}`,
+          content: `Unknown command: ${trimmed}`,
-        timestamp: new Date(),
+          timestamp: new Date(),
-      });
+        });
-      return { type: 'handled' };
+        return { type: 'handled' };
      } catch (e) {
        addItem(
          {
            type: MessageType.ERROR,
            text: e instanceof Error ? e.message : String(e),
          },
          Date.now(),
        );
        return { type: 'handled' };
      } finally {
        setIsProcessing(false);
      }
    },
    [
      config,
@ -375,6 +454,9 @@ export const useSlashCommandProcessor = (
      openPrivacyNotice,
      openEditorDialog,
      setQuittingMessages,
      setShellConfirmationRequest,
      setSessionShellAllowlist,
      setIsProcessing,
    ],
  );
@ -383,5 +465,6 @@ export const useSlashCommandProcessor = (
    slashCommands: commands,
    pendingHistoryItems,
    commandContext,
    shellConfirmationRequest,
  };
 };
--- a/packages/core/src/index.ts
+++ b/packages/core/src/index.ts
@ -35,6 +35,7 @@ export * from './utils/editor.js';
 export * from './utils/quotaErrorDetection.js';
 export * from './utils/fileUtils.js';
 export * from './utils/retry.js';
 export * from './utils/shell-utils.js';
 export * from './utils/systemEncoding.js';
 export * from './utils/textUtils.js';
 export * from './utils/formatters.js';
--- a/packages/core/src/utils/shell-utils.test.ts
+++ b/packages/core/src/utils/shell-utils.test.ts
@ -6,578 +6,272 @@
 import { expect, describe, it, beforeEach } from 'vitest';
 import {
  checkCommandPermissions,
  getCommandRoots,
  isCommandAllowed,
  stripShellWrapper,
 } from './shell-utils.js';
 import { Config } from '../config/config.js';
 let config: Config;
 beforeEach(() => {
  config = {
    getCoreTools: () => [],
    getExcludeTools: () => [],
  } as unknown as Config;
 });
 describe('isCommandAllowed', () => {
-  let config: Config;
+  it('should allow a command if no restrictions are provided', () => {
  beforeEach(() => {
    config = {
      getCoreTools: () => undefined,
      getExcludeTools: () => undefined,
    } as unknown as Config;
  });
  it('should allow a command if no restrictions are provided', async () => {
    const result = isCommandAllowed('ls -l', config);
    expect(result.allowed).toBe(true);
  });
-  it('should allow a command if it is in the allowed list', async () => {
+  it('should allow a command if it is in the global allowlist', () => {
-    config = {
+    config.getCoreTools = () => ['ShellTool(ls)'];
      getCoreTools: () => ['ShellTool(ls -l)'],
      getExcludeTools: () => undefined,
    } as unknown as Config;
    const result = isCommandAllowed('ls -l', config);
    expect(result.allowed).toBe(true);
  });
-  it('should block a command if it is not in the allowed list', async () => {
+  it('should block a command if it is not in a strict global allowlist', () => {
-    config = {
+    config.getCoreTools = () => ['ShellTool(ls -l)'];
-      getCoreTools: () => ['ShellTool(ls -l)'],
+    const result = isCommandAllowed('rm -rf /', config);
-      getExcludeTools: () => undefined,
+    expect(result.allowed).toBe(false);
-    } as unknown as Config;
+    expect(result.reason).toBe(`Command(s) not in the allowed commands list.`);
  });
  it('should block a command if it is in the blocked list', () => {
    config.getExcludeTools = () => ['ShellTool(rm -rf /)'];
    const result = isCommandAllowed('rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
-      "Command 'rm -rf /' is not in the allowed commands list",
+      `Command 'rm -rf /' is blocked by configuration`,
    );
  });
-  it('should block a command if it is in the blocked list', async () => {
+  it('should prioritize the blocklist over the allowlist', () => {
-    config = {
+    config.getCoreTools = () => ['ShellTool(rm -rf /)'];
-      getCoreTools: () => undefined,
+    config.getExcludeTools = () => ['ShellTool(rm -rf /)'];
      getExcludeTools: () => ['ShellTool(rm -rf /)'],
    } as unknown as Config;
    const result = isCommandAllowed('rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
-      "Command 'rm -rf /' is blocked by configuration",
+      `Command 'rm -rf /' is blocked by configuration`,
    );
  });
-  it('should allow a command if it is not in the blocked list', async () => {
+  it('should allow any command when a wildcard is in coreTools', () => {
-    config = {
+    config.getCoreTools = () => ['ShellTool'];
-      getCoreTools: () => undefined,
+    const result = isCommandAllowed('any random command', config);
      getExcludeTools: () => ['ShellTool(rm -rf /)'],
    } as unknown as Config;
    const result = isCommandAllowed('ls -l', config);
    expect(result.allowed).toBe(true);
  });
-  it('should block a command if it is in both the allowed and blocked lists', async () => {
+  it('should block any command when a wildcard is in excludeTools', () => {
-    config = {
+    config.getExcludeTools = () => ['run_shell_command'];
-      getCoreTools: () => ['ShellTool(rm -rf /)'],
+    const result = isCommandAllowed('any random command', config);
      getExcludeTools: () => ['ShellTool(rm -rf /)'],
    } as unknown as Config;
    const result = isCommandAllowed('rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is blocked by configuration",
    );
  });
  it('should allow any command when ShellTool is in coreTools without specific commands', async () => {
    config = {
      getCoreTools: () => ['ShellTool'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('any command', config);
    expect(result.allowed).toBe(true);
  });
  it('should block any command when ShellTool is in excludeTools without specific commands', async () => {
    config = {
      getCoreTools: () => [],
      getExcludeTools: () => ['ShellTool'],
    } as unknown as Config;
    const result = isCommandAllowed('any command', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      'Shell tool is globally disabled in configuration',
    );
  });
-  it('should allow a command if it is in the allowed list using the public-facing name', async () => {
+  it('should block a command on the blocklist even with a wildcard allow', () => {
-    config = {
+    config.getCoreTools = () => ['ShellTool'];
-      getCoreTools: () => ['run_shell_command(ls -l)'],
+    config.getExcludeTools = () => ['ShellTool(rm -rf /)'];
      getExcludeTools: () => undefined,
    } as unknown as Config;
    const result = isCommandAllowed('ls -l', config);
    expect(result.allowed).toBe(true);
  });
  it('should block a command if it is in the blocked list using the public-facing name', async () => {
    config = {
      getCoreTools: () => undefined,
      getExcludeTools: () => ['run_shell_command(rm -rf /)'],
    } as unknown as Config;
    const result = isCommandAllowed('rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
-      "Command 'rm -rf /' is blocked by configuration",
+      `Command 'rm -rf /' is blocked by configuration`,
    );
  });
-  it('should block any command when ShellTool is in excludeTools using the public-facing name', async () => {
+  it('should allow a chained command if all parts are on the global allowlist', () => {
-    config = {
+    config.getCoreTools = () => [
-      getCoreTools: () => [],
+      'run_shell_command(echo)',
-      getExcludeTools: () => ['run_shell_command'],
+      'run_shell_command(ls)',
-    } as unknown as Config;
+    ];
    const result = isCommandAllowed('any command', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      'Shell tool is globally disabled in configuration',
    );
  });
  it('should block any command if coreTools contains an empty ShellTool command list using the public-facing name', async () => {
    config = {
      getCoreTools: () => ['run_shell_command()'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('any command', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'any command' is not in the allowed commands list",
    );
  });
  it('should block any command if coreTools contains an empty ShellTool command list', async () => {
    config = {
      getCoreTools: () => ['ShellTool()'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('any command', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'any command' is not in the allowed commands list",
    );
  });
  it('should block a command with extra whitespace if it is in the blocked list', async () => {
    config = {
      getCoreTools: () => undefined,
      getExcludeTools: () => ['ShellTool(rm -rf /)'],
    } as unknown as Config;
    const result = isCommandAllowed(' rm  -rf  / ', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is blocked by configuration",
    );
  });
  it('should allow any command when ShellTool is in present with specific commands', async () => {
    config = {
      getCoreTools: () => ['ShellTool', 'ShellTool(ls)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('any command', config);
    expect(result.allowed).toBe(true);
  });
  it('should block a command on the blocklist even with a wildcard allow', async () => {
    config = {
      getCoreTools: () => ['ShellTool'],
      getExcludeTools: () => ['ShellTool(rm -rf /)'],
    } as unknown as Config;
    const result = isCommandAllowed('rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is blocked by configuration",
    );
  });
  it('should allow a command that starts with an allowed command prefix', async () => {
    config = {
      getCoreTools: () => ['ShellTool(gh issue edit)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed(
      'gh issue edit 1 --add-label "kind/feature"',
      config,
    );
    expect(result.allowed).toBe(true);
  });
  it('should allow a command that starts with an allowed command prefix using the public-facing name', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(gh issue edit)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed(
      'gh issue edit 1 --add-label "kind/feature"',
      config,
    );
    expect(result.allowed).toBe(true);
  });
  it('should not allow a command that starts with an allowed command prefix but is chained with another command', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(gh issue edit)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('gh issue edit&&rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is not in the allowed commands list",
    );
  });
  it('should not allow a command that is a prefix of an allowed command', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(gh issue edit)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('gh issue', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'gh issue' is not in the allowed commands list",
    );
  });
  it('should not allow a command that is a prefix of a blocked command', async () => {
    config = {
      getCoreTools: () => [],
      getExcludeTools: () => ['run_shell_command(gh issue edit)'],
    } as unknown as Config;
    const result = isCommandAllowed('gh issue', config);
    expect(result.allowed).toBe(true);
  });
  it('should not allow a command that is chained with a pipe', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(gh issue list)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('gh issue list | rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is not in the allowed commands list",
    );
  });
  it('should not allow a command that is chained with a semicolon', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(gh issue list)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('gh issue list; rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is not in the allowed commands list",
    );
  });
  it('should block a chained command if any part is blocked', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(echo "hello")'],
      getExcludeTools: () => ['run_shell_command(rm)'],
    } as unknown as Config;
    const result = isCommandAllowed('echo "hello" && rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is blocked by configuration",
    );
  });
  it('should block a command if its prefix is on the blocklist, even if the command itself is on the allowlist', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(git push)'],
      getExcludeTools: () => ['run_shell_command(git)'],
    } as unknown as Config;
    const result = isCommandAllowed('git push', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'git push' is blocked by configuration",
    );
  });
  it('should be case-sensitive in its matching', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(echo)'],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('ECHO "hello"', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      'Command \'ECHO "hello"\' is not in the allowed commands list',
    );
  });
  it('should correctly handle commands with extra whitespace around chaining operators', async () => {
    config = {
      getCoreTools: () => ['run_shell_command(ls -l)'],
      getExcludeTools: () => ['run_shell_command(rm)'],
    } as unknown as Config;
    const result = isCommandAllowed('ls -l  ;  rm -rf /', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
      "Command 'rm -rf /' is blocked by configuration",
    );
  });
  it('should allow a chained command if all parts are allowed', async () => {
    config = {
      getCoreTools: () => [
        'run_shell_command(echo)',
        'run_shell_command(ls -l)',
      ],
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('echo "hello" && ls -l', config);
    expect(result.allowed).toBe(true);
  });
-  it('should block a command with command substitution using backticks', async () => {
+  it('should block a chained command if any part is blocked', () => {
-    config = {
+    config.getExcludeTools = () => ['run_shell_command(rm)'];
-      getCoreTools: () => ['run_shell_command(echo)'],
+    const result = isCommandAllowed('echo "hello" && rm -rf /', config);
      getExcludeTools: () => [],
    } as unknown as Config;
    const result = isCommandAllowed('echo `rm -rf /`', config);
    expect(result.allowed).toBe(false);
    expect(result.reason).toBe(
-      'Command substitution using $(), <(), or >() is not allowed for security reasons',
+      `Command 'rm -rf /' is blocked by configuration`,
    );
  });
-  it('should block a command with command substitution using $()', async () => {
+  describe('command substitution', () => {
-    config = {
+    it('should block command substitution using `$(...)`', () => {
-      getCoreTools: () => ['run_shell_command(echo)'],
+      const result = isCommandAllowed('echo $(rm -rf /)', config);
-      getExcludeTools: () => [],
+      expect(result.allowed).toBe(false);
-    } as unknown as Config;
+      expect(result.reason).toContain('Command substitution');
-    const result = isCommandAllowed('echo $(rm -rf /)', config);
+    });
-    expect(result.allowed).toBe(false);
+
-    expect(result.reason).toBe(
+    it('should block command substitution using `<(...)`', () => {
-      'Command substitution using $(), <(), or >() is not allowed for security reasons',
+      const result = isCommandAllowed('diff <(ls) <(ls -a)', config);
-    );
+      expect(result.allowed).toBe(false);
      expect(result.reason).toContain('Command substitution');
    });
    it('should block command substitution using backticks', () => {
      const result = isCommandAllowed('echo `rm -rf /`', config);
      expect(result.allowed).toBe(false);
      expect(result.reason).toContain('Command substitution');
    });
    it('should allow substitution-like patterns inside single quotes', () => {
      config.getCoreTools = () => ['ShellTool(echo)'];
      const result = isCommandAllowed("echo '$(pwd)'", config);
      expect(result.allowed).toBe(true);
    });
  });
 });
 describe('checkCommandPermissions', () => {
  describe('in "Default Allow" mode (no sessionAllowlist)', () => {
    it('should return a detailed success object for an allowed command', () => {
      const result = checkCommandPermissions('ls -l', config);
      expect(result).toEqual({
        allAllowed: true,
        disallowedCommands: [],
      });
    });
    it('should return a detailed failure object for a blocked command', () => {
      config.getExcludeTools = () => ['ShellTool(rm)'];
      const result = checkCommandPermissions('rm -rf /', config);
      expect(result).toEqual({
        allAllowed: false,
        disallowedCommands: ['rm -rf /'],
        blockReason: `Command 'rm -rf /' is blocked by configuration`,
        isHardDenial: true,
      });
    });
    it('should return a detailed failure object for a command not on a strict allowlist', () => {
      config.getCoreTools = () => ['ShellTool(ls)'];
      const result = checkCommandPermissions('git status && ls', config);
      expect(result).toEqual({
        allAllowed: false,
        disallowedCommands: ['git status'],
        blockReason: `Command(s) not in the allowed commands list.`,
        isHardDenial: false,
      });
    });
  });
-  it('should block a command with process substitution using <()', async () => {
+  describe('in "Default Deny" mode (with sessionAllowlist)', () => {
-    config = {
+    it('should allow a command on the sessionAllowlist', () => {
-      getCoreTools: () => ['run_shell_command(diff)'],
+      const result = checkCommandPermissions(
-      getExcludeTools: () => [],
+        'ls -l',
-    } as unknown as Config;
+        config,
-    const result = isCommandAllowed('diff <(ls) <(ls -a)', config);
+        new Set(['ls -l']),
-    expect(result.allowed).toBe(false);
+      );
-    expect(result.reason).toBe(
+      expect(result.allAllowed).toBe(true);
-      'Command substitution using $(), <(), or >() is not allowed for security reasons',
+    });
    );
  });
-  it('should allow a command with I/O redirection', async () => {
+    it('should block a command not on the sessionAllowlist or global allowlist', () => {
-    config = {
+      const result = checkCommandPermissions(
-      getCoreTools: () => ['run_shell_command(echo)'],
+        'rm -rf /',
-      getExcludeTools: () => [],
+        config,
-    } as unknown as Config;
+        new Set(['ls -l']),
-    const result = isCommandAllowed('echo "hello" > file.txt', config);
+      );
-    expect(result.allowed).toBe(true);
+      expect(result.allAllowed).toBe(false);
-  });
+      expect(result.blockReason).toContain(
        'not on the global or session allowlist',
      );
      expect(result.disallowedCommands).toEqual(['rm -rf /']);
    });
-  it('should not allow a command that is chained with a double pipe', async () => {
+    it('should allow a command on the global allowlist even if not on the session allowlist', () => {
-    config = {
+      config.getCoreTools = () => ['ShellTool(git status)'];
-      getCoreTools: () => ['run_shell_command(gh issue list)'],
+      const result = checkCommandPermissions(
-      getExcludeTools: () => [],
+        'git status',
-    } as unknown as Config;
+        config,
-    const result = isCommandAllowed('gh issue list || rm -rf /', config);
+        new Set(['ls -l']),
-    expect(result.allowed).toBe(false);
+      );
-    expect(result.reason).toBe(
+      expect(result.allAllowed).toBe(true);
-      "Command 'rm -rf /' is not in the allowed commands list",
+    });
-    );
+
    it('should allow a chained command if parts are on different allowlists', () => {
      config.getCoreTools = () => ['ShellTool(git status)'];
      const result = checkCommandPermissions(
        'git status && git commit',
        config,
        new Set(['git commit']),
      );
      expect(result.allAllowed).toBe(true);
    });
    it('should block a command on the sessionAllowlist if it is also globally blocked', () => {
      config.getExcludeTools = () => ['run_shell_command(rm)'];
      const result = checkCommandPermissions(
        'rm -rf /',
        config,
        new Set(['rm -rf /']),
      );
      expect(result.allAllowed).toBe(false);
      expect(result.blockReason).toContain('is blocked by configuration');
    });
    it('should block a chained command if one part is not on any allowlist', () => {
      config.getCoreTools = () => ['run_shell_command(echo)'];
      const result = checkCommandPermissions(
        'echo "hello" && rm -rf /',
        config,
        new Set(['echo']),
      );
      expect(result.allAllowed).toBe(false);
      expect(result.disallowedCommands).toEqual(['rm -rf /']);
    });
  });
 });
 describe('getCommandRoots', () => {
  it('should return a single command', () => {
-    const result = getCommandRoots('ls -l');
+    expect(getCommandRoots('ls -l')).toEqual(['ls']);
    expect(result).toEqual(['ls']);
  });
-  it('should return multiple commands', () => {
+  it('should handle paths and return the binary name', () => {
-    const result = getCommandRoots('ls -l | grep "test"');
+    expect(getCommandRoots('/usr/local/bin/node script.js')).toEqual(['node']);
    expect(result).toEqual(['ls', 'grep']);
  });
  it('should handle multiple commands with &&', () => {
    const result = getCommandRoots('npm run build && npm test');
    expect(result).toEqual(['npm', 'npm']);
  });
  it('should handle multiple commands with ;', () => {
    const result = getCommandRoots('echo "hello"; echo "world"');
    expect(result).toEqual(['echo', 'echo']);
  });
  it('should handle a mix of operators', () => {
    const result = getCommandRoots(
      'cat package.json | grep "version" && echo "done"',
    );
    expect(result).toEqual(['cat', 'grep', 'echo']);
  });
  it('should handle commands with paths', () => {
    const result = getCommandRoots('/usr/local/bin/node script.js');
    expect(result).toEqual(['node']);
  });
  it('should return an empty array for an empty string', () => {
-    const result = getCommandRoots('');
+    expect(getCommandRoots('')).toEqual([]);
-    expect(result).toEqual([]);
+  });
  it('should handle a mix of operators', () => {
    const result = getCommandRoots('a;b|c&&d||e&f');
    expect(result).toEqual(['a', 'b', 'c', 'd', 'e', 'f']);
  });
  it('should correctly parse a chained command with quotes', () => {
    const result = getCommandRoots('echo "hello" && git commit -m "feat"');
    expect(result).toEqual(['echo', 'git']);
  });
 });
 describe('stripShellWrapper', () => {
-  it('should strip sh -c from the beginning of the command', () => {
+  it('should strip sh -c with quotes', () => {
-    const result = stripShellWrapper('sh -c "ls -l"');
+    expect(stripShellWrapper('sh -c "ls -l"')).toEqual('ls -l');
    expect(result).toEqual('ls -l');
  });
-  it('should strip bash -c from the beginning of the command', () => {
+  it('should strip bash -c with extra whitespace', () => {
-    const result = stripShellWrapper('bash -c "ls -l"');
+    expect(stripShellWrapper('  bash  -c  "ls -l"  ')).toEqual('ls -l');
    expect(result).toEqual('ls -l');
  });
-  it('should strip zsh -c from the beginning of the command', () => {
+  it('should strip zsh -c without quotes', () => {
-    const result = stripShellWrapper('zsh -c "ls -l"');
+    expect(stripShellWrapper('zsh -c ls -l')).toEqual('ls -l');
    expect(result).toEqual('ls -l');
  });
-  it('should not strip anything if the command does not start with a shell wrapper', () => {
+  it('should strip cmd.exe /c', () => {
-    const result = stripShellWrapper('ls -l');
+    expect(stripShellWrapper('cmd.exe /c "dir"')).toEqual('dir');
    expect(result).toEqual('ls -l');
  });
-  it('should handle extra whitespace', () => {
+  it('should not strip anything if no wrapper is present', () => {
-    const result = stripShellWrapper('  sh   -c   "ls -l"  ');
+    expect(stripShellWrapper('ls -l')).toEqual('ls -l');
    expect(result).toEqual('ls -l');
  });
  it('should handle commands without quotes', () => {
    const result = stripShellWrapper('sh -c ls -l');
    expect(result).toEqual('ls -l');
  });
  it('should strip cmd.exe /c from the beginning of the command', () => {
    const result = stripShellWrapper('cmd.exe /c "dir"');
    expect(result).toEqual('dir');
  });
 });
 describe('getCommandRoots', () => {
  it('should handle multiple commands with &', () => {
    const result = getCommandRoots('echo "hello" & echo "world"');
    expect(result).toEqual(['echo', 'echo']);
  });
 });
 describe('command substitution', () => {
  let config: Config;
  beforeEach(() => {
    config = {
      getCoreTools: () => ['run_shell_command(echo)', 'run_shell_command(gh)'],
      getExcludeTools: () => [],
    } as unknown as Config;
  });
  it('should block unquoted command substitution `$(...)`', () => {
    const result = isCommandAllowed('echo $(pwd)', config);
    expect(result.allowed).toBe(false);
  });
  it('should block unquoted command substitution `<(...)`', () => {
    const result = isCommandAllowed('echo <(pwd)', config);
    expect(result.allowed).toBe(false);
  });
  it('should allow command substitution in single quotes', () => {
    const result = isCommandAllowed("echo '$(pwd)'", config);
    expect(result.allowed).toBe(true);
  });
  it('should allow backticks in single quotes', () => {
    const result = isCommandAllowed("echo '`rm -rf /`'", config);
    expect(result.allowed).toBe(true);
  });
  it('should block command substitution in double quotes', () => {
    const result = isCommandAllowed('echo "$(pwd)"', config);
    expect(result.allowed).toBe(false);
  });
  it('should allow escaped command substitution', () => {
    const result = isCommandAllowed('echo \\$(pwd)', config);
    expect(result.allowed).toBe(true);
  });
  it('should allow complex commands with quoted substitution-like patterns', () => {
    const command =
      "gh pr comment 4795 --body 'This is a test comment with $(pwd) style text'";
    const result = isCommandAllowed(command, config);
    expect(result.allowed).toBe(true);
  });
  it('should block complex commands with unquoted substitution-like patterns', () => {
    const command =
      'gh pr comment 4795 --body "This is a test comment with $(pwd) style text"';
    const result = isCommandAllowed(command, config);
    expect(result.allowed).toBe(false);
  });
  it('should allow a command with markdown content using proper quoting', () => {
    // Simple test with safe content in single quotes
    const result = isCommandAllowed(
      "gh pr comment 4795 --body 'This is safe markdown content'",
      config,
    );
    expect(result.allowed).toBe(true);
  });
 });
 describe('getCommandRoots with quote handling', () => {
  it('should correctly parse a simple command', () => {
    const result = getCommandRoots('git status');
    expect(result).toEqual(['git']);
  });
  it('should correctly parse a command with a quoted argument', () => {
    const result = getCommandRoots('git commit -m "feat: new feature"');
    expect(result).toEqual(['git']);
  });
  it('should correctly parse a command with single quotes', () => {
    const result = getCommandRoots("echo 'hello world'");
    expect(result).toEqual(['echo']);
  });
  it('should correctly parse a chained command with quotes', () => {
    const result = getCommandRoots('echo "hello" && git status');
    expect(result).toEqual(['echo', 'git']);
  });
  it('should correctly parse a complex chained command', () => {
    const result = getCommandRoots(
      'git commit -m "feat: new feature" && echo "done"',
    );
    expect(result).toEqual(['git', 'echo']);
  });
  it('should handle escaped quotes', () => {
    const result = getCommandRoots('echo "this is a "quote""');
    expect(result).toEqual(['echo']);
  });
  it('should handle commands with no spaces', () => {
    const result = getCommandRoots('command');
    expect(result).toEqual(['command']);
  });
  it('should handle multiple separators', () => {
    const result = getCommandRoots('a;b|c&&d||e&f');
    expect(result).toEqual(['a', 'b', 'c', 'd', 'e', 'f']);
  });
 });
--- a/packages/core/src/utils/shell-utils.ts
+++ b/packages/core/src/utils/shell-utils.ts
@ -179,38 +179,53 @@ export function detectCommandSubstitution(command: string): boolean {
 }
 /**
- * Determines whether a given shell command is allowed to execute based on
+ * Checks a shell command against security policies and allowlists.
- * the tool's configuration including allowlists and blocklists.
+ *
- * @param command The shell command string to validate
+ * This function operates in one of two modes depending on the presence of
- * @param config The application configuration
+ * the `sessionAllowlist` parameter:
- * @returns An object with 'allowed' boolean and optional 'reason' string if not allowed
+ *
 * 1.  **"Default Deny" Mode (sessionAllowlist is provided):** This is the
 *     strictest mode, used for user-defined scripts like custom commands.
 *     A command is only permitted if it is found on the global `coreTools`
 *     allowlist OR the provided `sessionAllowlist`. It must not be on the
 *     global `excludeTools` blocklist.
 *
 * 2.  **"Default Allow" Mode (sessionAllowlist is NOT provided):** This mode
 *     is used for direct tool invocations (e.g., by the model). If a strict
 *     global `coreTools` allowlist exists, commands must be on it. Otherwise,
 *     any command is permitted as long as it is not on the `excludeTools`
 *     blocklist.
 *
 * @param command The shell command string to validate.
 * @param config The application configuration.
 * @param sessionAllowlist A session-level list of approved commands. Its
 *   presence activates "Default Deny" mode.
 * @returns An object detailing which commands are not allowed.
 */
-export function isCommandAllowed(
+export function checkCommandPermissions(
  command: string,
  config: Config,
-): { allowed: boolean; reason?: string } {
+  sessionAllowlist?: Set<string>,
-  // 0. Disallow command substitution
+): {
-  // Parse the command to check for unquoted/unescaped command substitution
+  allAllowed: boolean;
-  const hasCommandSubstitution = detectCommandSubstitution(command);
+  disallowedCommands: string[];
-  if (hasCommandSubstitution) {
+  blockReason?: string;
  isHardDenial?: boolean;
 } {
  // Disallow command substitution for security.
  if (detectCommandSubstitution(command)) {
    return {
-      allowed: false,
+      allAllowed: false,
-      reason:
+      disallowedCommands: [command],
      blockReason:
        'Command substitution using $(), <(), or >() is not allowed for security reasons',
      isHardDenial: true,
    };
  }
  const SHELL_TOOL_NAMES = ['run_shell_command', 'ShellTool'];
  const normalize = (cmd: string): string => cmd.trim().replace(/\s+/g, ' ');
  /**
   * Checks if a command string starts with a given prefix, ensuring it's a
   * whole word match (i.e., followed by a space or it's an exact match).
   * e.g., `isPrefixedBy('npm install', 'npm')` -> true
   * e.g., `isPrefixedBy('npm', 'npm')` -> true
   * e.g., `isPrefixedBy('npminstall', 'npm')` -> false
   */
  const isPrefixedBy = (cmd: string, prefix: string): boolean => {
    if (!cmd.startsWith(prefix)) {
      return false;
@ -218,10 +233,6 @@ export function isCommandAllowed(
    return cmd.length === prefix.length || cmd[prefix.length] === ' ';
  };
  /**
   * Extracts and normalizes shell commands from a list of tool strings.
   * e.g., 'ShellTool("ls -l")' becomes 'ls -l'
   */
  const extractCommands = (tools: string[]): string[] =>
    tools.flatMap((tool) => {
      for (const toolName of SHELL_TOOL_NAMES) {
@ -234,55 +245,115 @@ export function isCommandAllowed(
  const coreTools = config.getCoreTools() || [];
  const excludeTools = config.getExcludeTools() || [];
  const commandsToValidate = splitCommands(command).map(normalize);
-  // 1. Check if the shell tool is globally disabled.
+  // 1. Blocklist Check (Highest Priority)
  if (SHELL_TOOL_NAMES.some((name) => excludeTools.includes(name))) {
    return {
-      allowed: false,
+      allAllowed: false,
-      reason: 'Shell tool is globally disabled in configuration',
+      disallowedCommands: commandsToValidate,
      blockReason: 'Shell tool is globally disabled in configuration',
      isHardDenial: true,
    };
  }
  const blockedCommands = extractCommands(excludeTools);
  for (const cmd of commandsToValidate) {
    if (blockedCommands.some((blocked) => isPrefixedBy(cmd, blocked))) {
      return {
        allAllowed: false,
        disallowedCommands: [cmd],
        blockReason: `Command '${cmd}' is blocked by configuration`,
        isHardDenial: true,
      };
    }
  }
-  const blockedCommands = new Set(extractCommands(excludeTools));
+  const globallyAllowedCommands = extractCommands(coreTools);
  const allowedCommands = new Set(extractCommands(coreTools));
  const hasSpecificAllowedCommands = allowedCommands.size > 0;
  const isWildcardAllowed = SHELL_TOOL_NAMES.some((name) =>
    coreTools.includes(name),
  );
-  const commandsToValidate = splitCommands(command).map(normalize);
+  // If there's a global wildcard, all commands are allowed at this point
  // because they have already passed the blocklist check.
  if (isWildcardAllowed) {
    return { allAllowed: true, disallowedCommands: [] };
  }
-  const blockedCommandsArr = [...blockedCommands];
+  if (sessionAllowlist) {
    // "DEFAULT DENY" MODE: A session allowlist is provided.
    // All commands must be in either the session or global allowlist.
    const disallowedCommands: string[] = [];
    for (const cmd of commandsToValidate) {
      const isSessionAllowed = [...sessionAllowlist].some((allowed) =>
        isPrefixedBy(cmd, normalize(allowed)),
      );
      if (isSessionAllowed) continue;
-  for (const cmd of commandsToValidate) {
+      const isGloballyAllowed = globallyAllowedCommands.some((allowed) =>
    // 2. Check if the command is on the blocklist.
    const isBlocked = blockedCommandsArr.some((blocked) =>
      isPrefixedBy(cmd, blocked),
    );
    if (isBlocked) {
      return {
        allowed: false,
        reason: `Command '${cmd}' is blocked by configuration`,
      };
    }
    // 3. If in strict allow-list mode, check if the command is permitted.
    const isStrictAllowlist = hasSpecificAllowedCommands && !isWildcardAllowed;
    const allowedCommandsArr = [...allowedCommands];
    if (isStrictAllowlist) {
      const isAllowed = allowedCommandsArr.some((allowed) =>
        isPrefixedBy(cmd, allowed),
      );
-      if (!isAllowed) {
+      if (isGloballyAllowed) continue;
      disallowedCommands.push(cmd);
    }
    if (disallowedCommands.length > 0) {
      return {
        allAllowed: false,
        disallowedCommands,
        blockReason: `Command(s) not on the global or session allowlist.`,
        isHardDenial: false, // This is a soft denial; confirmation is possible.
      };
    }
  } else {
    // "DEFAULT ALLOW" MODE: No session allowlist.
    const hasSpecificAllowedCommands = globallyAllowedCommands.length > 0;
    if (hasSpecificAllowedCommands) {
      const disallowedCommands: string[] = [];
      for (const cmd of commandsToValidate) {
        const isGloballyAllowed = globallyAllowedCommands.some((allowed) =>
          isPrefixedBy(cmd, allowed),
        );
        if (!isGloballyAllowed) {
          disallowedCommands.push(cmd);
        }
      }
      if (disallowedCommands.length > 0) {
        return {
-          allowed: false,
+          allAllowed: false,
-          reason: `Command '${cmd}' is not in the allowed commands list`,
+          disallowedCommands,
          blockReason: `Command(s) not in the allowed commands list.`,
          isHardDenial: false, // This is a soft denial.
        };
      }
    }
    // If no specific global allowlist exists, and it passed the blocklist,
    // the command is allowed by default.
  }
-  // 4. If all checks pass, the command is allowed.
+  // If all checks for the current mode pass, the command is allowed.
-  return { allowed: true };
+  return { allAllowed: true, disallowedCommands: [] };
 }
 /**
 * Determines whether a given shell command is allowed to execute based on
 * the tool's configuration including allowlists and blocklists.
 *
 * This function operates in "default allow" mode. It is a wrapper around
 * `checkCommandPermissions`.
 *
 * @param command The shell command string to validate.
 * @param config The application configuration.
 * @returns An object with 'allowed' boolean and optional 'reason' string if not allowed.
 */
 export function isCommandAllowed(
  command: string,
  config: Config,
 ): { allowed: boolean; reason?: string } {
  // By not providing a sessionAllowlist, we invoke "default allow" behavior.
  const { allAllowed, blockReason } = checkCommandPermissions(command, config);
  if (allAllowed) {
    return { allowed: true };
  }
  return { allowed: false, reason: blockReason };
 }