chore: Update utils.py to support chaining (#3261)

fengju0213 · Wendong-Fan · web-flow · commit ee7b2ad092d1 · 2025-10-12T01:23:39.000+08:00
Co-authored-by: Wendong-Fan <133094783+Wendong-Fan@users.noreply.github.com>
Co-authored-by: Wendong-Fan <w3ndong.fan@gmail.com>
diff --git a/.github/ISSUE_TEMPLATE/bug_report.yml b/.github/ISSUE_TEMPLATE/bug_report.yml
@@ -26,7 +26,7 @@ body:
     attributes:
       label: What version of camel are you using?
       description: Run command `python3 -c 'print(__import__("camel").__version__)'` in your shell and paste the output here.
-      placeholder: E.g., 0.2.76a14
+      placeholder: E.g., 0.2.76
     validations:
       required: true
 
diff --git a/.gitignore b/.gitignore
@@ -415,6 +415,7 @@ tags
 
 # Camel
 logs/
+tool_cache/
 
 # Download Configuration
 cookies.txt
diff --git a/camel/__init__.py b/camel/__init__.py
@@ -14,7 +14,7 @@
 
 from camel.logger import disable_logging, enable_logging, set_log_level
 
-__version__ = '0.2.76a14'
+__version__ = '0.2.76'
 
 __all__ = [
     '__version__',
diff --git a/camel/data_collectors/alpaca_collector.py b/camel/data_collectors/alpaca_collector.py
@@ -70,16 +70,25 @@ def convert(self) -> Dict[str, Any]:
         if not history:
             raise ValueError("No data collected.")
 
-        # Validate and process history
-        if len(history) == 3 and history[0].role == "system":
-            history = history[1:]  # Ignore the system message.
-        elif len(history) != 2:
+        # Filter out system and tool-related messages
+        # Keep only user and final assistant messages
+        filtered_history = []
+        for msg in history:
+            if msg.role == "user":
+                filtered_history.append(msg)
+            elif msg.role == "assistant" and msg.message:
+                # Keep assistant messages with actual content
+                # (skip empty ones that only contain tool calls)
+                filtered_history.append(msg)
+
+        # Validate filtered history
+        if len(filtered_history) != 2:
             raise ValueError(
                 f"AlpacaDataCollector only supports one message pair, but "
-                f"got {len(history)}"
+                f"got {len(filtered_history)} after filtering tool messages"
             )
 
-        input_message, output_message = history
+        input_message, output_message = filtered_history
         instruction = (
             self.system_message.content if self.system_message else ""
         ) + str(input_message.message)
diff --git a/camel/toolkits/terminal_toolkit/utils.py b/camel/toolkits/terminal_toolkit/utils.py
@@ -15,7 +15,6 @@
 import os
 import platform
 import re
-import shlex
 import shutil
 import subprocess
 import sys
@@ -27,38 +26,99 @@
 logger = get_logger(__name__)
 
 
-def contains_command_chaining(command: str) -> bool:
-    r"""Check if command contains chaining operators that could be used to
-    bypass security.
+def check_command_safety(
+    command: str,
+    allowed_commands: Optional[Set[str]] = None,
+) -> Tuple[bool, str]:
+    r"""Check if a command (potentially with chaining) is safe to execute.
+
+    Args:
+        command (str): The command string to check
+        allowed_commands (Optional[Set[str]]): Set of allowed commands
+            (whitelist mode)
+
+    Returns:
+        Tuple[bool, str]: (is_safe, reason)
     """
-    # Pattern to match command chaining operators: ;, &&, ||, |
-    # But exclude cases where they are inside quotes or escaped
-    chaining_pattern = r'''
-        (?<!\\)      # Not preceded by backslash (not escaped)
-        (?:          # Group for alternation
-            ;        # Semicolon
-            |        # OR
-            \|\|     # Logical OR
-            |        # OR  
-            &&       # Logical AND
-            |        # OR
-            (?<!\|)  # Not preceded by pipe (to avoid matching ||)
-            \|       # Single pipe
-            (?!\|)   # Not followed by pipe (to avoid matching ||)
-        )
-        (?=          # Positive lookahead
-            (?:      # Group
-                [^"'] # Not a quote
-                |     # OR
-                "[^"]*" # Content in double quotes
-                |     # OR
-                '[^']*' # Content in single quotes
-            )*       # Zero or more times
-            $        # End of string
-        )
-    '''
+    if not command.strip():
+        return False, "Empty command is not allowed."
 
-    return bool(re.search(chaining_pattern, command, re.VERBOSE))
+    # Dangerous commands list - including ALL rm operations
+    dangerous_commands = [
+        # System administration
+        'sudo',
+        'su',
+        'reboot',
+        'shutdown',
+        'halt',
+        'poweroff',
+        'init',
+        # File system manipulation
+        'rm',
+        'chown',
+        'chgrp',
+        'umount',
+        'mount',
+        # Disk operations
+        'dd',
+        'mkfs',
+        'fdisk',
+        'parted',
+        'fsck',
+        'mkswap',
+        'swapon',
+        'swapoff',
+        # Process management
+        'service',
+        'systemctl',
+        'systemd',
+        # Network configuration
+        'iptables',
+        'ip6tables',
+        'ifconfig',
+        'route',
+        'iptables-save',
+        # Cron and scheduling
+        'crontab',
+        'at',
+        'batch',
+        # User management
+        'useradd',
+        'userdel',
+        'usermod',
+        'passwd',
+        'chpasswd',
+        'newgrp',
+        # Kernel modules
+        'modprobe',
+        'rmmod',
+        'insmod',
+        'lsmod',
+    ]
+
+    # Remove quoted strings to avoid false positives
+    clean_command = re.sub(r'''["'][^"']*["']''', ' ', command)
+
+    # If whitelist mode, check ALL commands against the whitelist
+    if allowed_commands is not None:
+        # Extract all command words (at start or after operators)
+        cmd_pattern = r'(?:^|;|\||&&)\s*\b([a-zA-Z_/][\w\-/]*)'
+        found_commands = re.findall(cmd_pattern, clean_command, re.IGNORECASE)
+        for cmd in found_commands:
+            if cmd.lower() not in allowed_commands:
+                return (
+                    False,
+                    f"Command '{cmd}' is not in the allowed commands list.",
+                )
+        return True, ""
+
+    # Check for dangerous commands
+    for cmd in dangerous_commands:
+        pattern = rf'(?:^|;|\||&&)\s*\b{re.escape(cmd)}\b'
+        if re.search(pattern, clean_command, re.IGNORECASE):
+            return False, f"Command '{cmd}' is blocked for safety."
+
+    return True, ""
 
 
 def sanitize_command(
@@ -80,133 +140,25 @@ def sanitize_command(
     Returns:
         Tuple[bool, str]: (is_safe, message_or_command)
     """
-    # Apply security checks to both backends - security should be consistent
     if not safe_mode:
         return True, command  # Skip all checks if safe_mode is disabled
 
-    # First check for command chaining and pipes
-    if contains_command_chaining(command):
-        return (
-            False,
-            "Command chaining (;, &&, ||, |) is not allowed "
-            "for security reasons.",
-        )
-
-    parts = shlex.split(command)
-    if not parts:
-        return False, "Empty command is not allowed."
-    base_cmd = parts[0].lower()
-
-    # If whitelist is defined, only allow whitelisted commands
-    if allowed_commands is not None:
-        if base_cmd not in allowed_commands:
-            return (
-                False,
-                f"Command '{base_cmd}' is not in the allowed commands list.",
+    # Use safety checker
+    is_safe, reason = check_command_safety(command, allowed_commands)
+    if not is_safe:
+        return False, reason
+
+    # Additional check for local backend: prevent cd outside working directory
+    if not use_docker_backend and working_dir and 'cd ' in command:
+        # Extract cd commands and check their targets
+        cd_pattern = r'\bcd\s+([^\s;|&]+)'
+        for match in re.finditer(cd_pattern, command):
+            target_path = match.group(1).strip('\'"')
+            target_dir = os.path.abspath(
+                os.path.join(working_dir, target_path)
             )
-        # If command is whitelisted, skip the dangerous commands check
-        # but still apply other safety checks
-    else:
-        # Block dangerous commands (only when no whitelist is defined)
-        dangerous_commands = [
-            # System administration
-            'sudo',
-            'su',
-            'reboot',
-            'shutdown',
-            'halt',
-            'poweroff',
-            'init',
-            # File system manipulation
-            'rm',
-            'mv',
-            'chmod',
-            'chown',
-            'chgrp',
-            'umount',
-            'mount',
-            # Disk operations
-            'dd',
-            'mkfs',
-            'fdisk',
-            'parted',
-            'fsck',
-            'mkswap',
-            'swapon',
-            'swapoff',
-            # Process management
-            'kill',
-            'killall',
-            'pkill',
-            'service',
-            'systemctl',
-            'systemd',
-            # Network configuration
-            'iptables',
-            'ip6tables',
-            'ifconfig',
-            'route',
-            'iptables-save',
-            # Cron and scheduling
-            'crontab',
-            'at',
-            'batch',
-            # User management
-            'useradd',
-            'userdel',
-            'usermod',
-            'passwd',
-            'chpasswd',
-            'newgrp',
-            # Kernel modules
-            'modprobe',
-            'rmmod',
-            'insmod',
-            'lsmod',
-            # System information that could leak sensitive data
-            'dmesg',
-            'last',
-            'lastlog',
-            'who',
-            'w',
-        ]
-        if base_cmd in dangerous_commands:
-            # Special handling for rm command - use regex for precise checking
-            if base_cmd == 'rm':
-                # Check for dangerous rm options using regex
-                dangerous_rm_pattern = (
-                    r'\s-[^-\s]*[rf][^-\s]*\s|\s--force\s|'
-                    r'\s--recursive\s|\s-rf\s|\s-fr\s'
-                )
-                if re.search(dangerous_rm_pattern, command, re.IGNORECASE):
-                    return (
-                        False,
-                        f"Command '{base_cmd}' with forceful or "
-                        f"recursive options is blocked for safety.",
-                    )
-                # Also block rm without any target (could be dangerous)
-                if len(parts) < 2:
-                    return (
-                        False,
-                        "rm command requires target "
-                        "file/directory specification.",
-                    )
-            else:
-                return False, f"Command '{base_cmd}' is blocked for safety."
-
-    # For local backend only: prevent changing
-    # directory outside the workspace
-    # Docker containers are already sandboxed,
-    # so this check is not needed there
-    if (
-        not use_docker_backend
-        and base_cmd == 'cd'
-        and len(parts) > 1
-        and working_dir
-    ):
-        target_dir = os.path.abspath(os.path.join(working_dir, parts[1]))
-        if not target_dir.startswith(working_dir):
-            return False, "Cannot 'cd' outside of the working directory."
+            if not target_dir.startswith(working_dir):
+                return False, "Cannot 'cd' outside of the working directory."
 
     return True, command
 
diff --git a/docs/conf.py b/docs/conf.py
@@ -27,7 +27,7 @@
 project = 'CAMEL'
 copyright = '2024, CAMEL-AI.org'
 author = 'CAMEL-AI.org'
-release = '0.2.76a14'
+release = '0.2.76'
 
 html_favicon = (
     'https://raw.githubusercontent.com/camel-ai/camel/master/misc/favicon.png'
diff --git a/pyproject.toml b/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "hatchling.build"
 
 [project]
 name = "camel-ai"
-version = "0.2.76a14"
+version = "0.2.76"
 description = "Communicative Agents for AI Society Study"
 authors = [{ name = "CAMEL-AI.org" }]
 requires-python = ">=3.10,<3.13"
diff --git a/test/agents/test_chat_agent.py b/test/agents/test_chat_agent.py
@@ -880,6 +880,7 @@ def test_tool_calling_sync(step_call_count=3):
         system_message=system_message,
         model=model,
         tools=MathToolkit().get_tools(),
+        enable_tool_output_cache=False,
     )
 
     ref_funcs = MathToolkit().get_tools()
@@ -1052,6 +1053,7 @@ async def test_tool_calling_math_async(step_call_count=3):
         system_message=system_message,
         model=model,
         tools=math_funcs,
+        enable_tool_output_cache=False,
     )
 
     ref_funcs = math_funcs
@@ -1213,6 +1215,7 @@ def mock_run_tool_calling_async(*args, **kwargs):
         system_message=system_message,
         model=model,
         tools=[FunctionTool(async_sleep)],
+        enable_tool_output_cache=False,
     )
 
     assert len(agent.tool_dict) == 1
diff --git a/test/test_chat_agent_tool_cache.py b/test/test_chat_agent_tool_cache.py
diff --git a/uv.lock b/uv.lock

Original file line number	Diff line number	Diff line change
`@@ -880,6 +880,7 @@ def test_tool_calling_sync(step_call_count=3):`
`880`	`880`	`system_message=system_message,`
`881`	`881`	`model=model,`
`882`	`882`	`tools=MathToolkit().get_tools(),`
	`883`	`+ enable_tool_output_cache=False,`
`883`	`884`	`)`
`884`	`885`
`885`	`886`	`ref_funcs = MathToolkit().get_tools()`
`@@ -1052,6 +1053,7 @@ async def test_tool_calling_math_async(step_call_count=3):`
`1052`	`1053`	`system_message=system_message,`
`1053`	`1054`	`model=model,`
`1054`	`1055`	`tools=math_funcs,`
	`1056`	`+ enable_tool_output_cache=False,`
`1055`	`1057`	`)`
`1056`	`1058`
`1057`	`1059`	`ref_funcs = math_funcs`
`@@ -1213,6 +1215,7 @@ def mock_run_tool_calling_async(*args, **kwargs):`
`1213`	`1215`	`system_message=system_message,`
`1214`	`1216`	`model=model,`
`1215`	`1217`	`tools=[FunctionTool(async_sleep)],`
	`1218`	`+ enable_tool_output_cache=False,`
`1216`	`1219`	`)`
`1217`	`1220`
`1218`	`1221`	`assert len(agent.tool_dict) == 1`