inclusionAI · JacksonMei · Mar 4, 2026 · Mar 2, 2026 · Mar 2, 2026 · Mar 2, 2026
diff --git a/aenv/pyproject.toml b/aenv/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "aenvironment"
-version = "0.1.4"
+version = "0.1.5"
 description = "AEnvironment Python SDK - Production-grade environment for AI agent tools"
 readme = "README.md"
 requires-python = ">=3.10"

diff --git a/aenv/src/aenv/__init__.py b/aenv/src/aenv/__init__.py
@@ -26,10 +26,11 @@
     register_health,
     register_reward,
 )
+from aenv.core.logging import setup_logging
 from aenv.core.models import EnvInstance, EnvStatus
 from aenv.core.tool import Tool, get_registry, register_tool
 
-__version__ = "0.1.0"
+__version__ = "0.1.5"
 __all__ = [
     "Tool",
     "register_tool",
@@ -43,4 +44,5 @@
     "EnvironmentError",
     "EnvInstance",
     "EnvStatus",
+    "setup_logging",
 ]
diff --git a/aenv/src/aenv/client/scheduler_client.py b/aenv/src/aenv/client/scheduler_client.py
@@ -111,6 +111,7 @@ async def create_env_instance(
         environment_variables: Optional[Dict[str, str]] = None,
         arguments: Optional[List[str]] = None,
         owner: Optional[str] = None,
+        labels: Optional[Dict[str, str]] = None,
     ) -> EnvInstance:
         """
         Create a new environment instance.
@@ -122,6 +123,7 @@ async def create_env_instance(
             arguments: Optional arguments
             ttl: Time to live for instance
             owner: Optional owner of the instance
+            labels: Optional labels for the instance
         Returns:
             Created EnvInstance
 
@@ -133,7 +135,7 @@ async def create_env_instance(
             raise NetworkError("Client not connected")
 
         logger.info(
-            f"Creating environment instance: {name}, datasource: {datasource}, ttl: {ttl}, environment_variables: {environment_variables}, arguments: {arguments}, owner: {owner}, url: {self.base_url}"
+            f"Creating environment instance: {name}, datasource: {datasource}, ttl: {ttl}, environment_variables: {environment_variables}, arguments: {arguments}, owner: {owner}, labels: {labels}, url: {self.base_url}"
         )
         request = EnvInstanceCreateRequest(
             envName=name,
@@ -142,6 +144,7 @@ async def create_env_instance(
             arguments=arguments,
             ttl=ttl,
             owner=owner,
+            labels=labels,
         )
 
         for attempt in range(self.max_retries + 1):

diff --git a/aenv/src/aenv/core/environment.py b/aenv/src/aenv/core/environment.py
@@ -117,6 +117,7 @@ def __init__(
         api_key: Optional[str] = None,
         skip_for_healthy: bool = False,
         owner: Optional[str] = None,
+        labels: Optional[Dict[str, str]] = None,
     ):
         """
         Initialize environment.
@@ -141,6 +142,7 @@ def __init__(
         self.dummy_instance_ip = os.getenv("DUMMY_INSTANCE_IP")
         self.skip_for_healthy = skip_for_healthy
         self.owner = owner
+        self.labels = labels
 
         if not aenv_url:
             aenv_url = self.dummy_instance_ip or os.getenv(
@@ -163,6 +165,7 @@ def __init__(
         self._initialized = False
         self._client: Optional[AEnvSchedulerClient] = None
         self._mcp_client: Optional[Client] = None
+        self._mcp_session_active: bool = False
 
     def _log_prefix(self) -> str:
         """Get log prefix with instance ID."""
@@ -257,6 +260,7 @@ async def release(self):
                 )
             finally:
                 self._mcp_client = None
+                self._mcp_session_active = False
 
         if self._client:
             if self._instance and not self.dummy_instance_ip:
@@ -298,23 +302,22 @@ async def list_tools(self) -> List[Dict[str, Any]]:
         await self._ensure_initialized()
 
         try:
-            client = await self._get_mcp_client()
-            async with client:
-                tools = await client.list_tools()
-                logger.info(
-                    f"{self._log_prefix()} Found {len(tools)} tools in environment {self.env_name}"
-                )
+            client = await self._ensure_mcp_session()
+            tools = await client.list_tools()
+            logger.info(
+                f"{self._log_prefix()} Found {len(tools)} tools in environment {self.env_name}"
+            )
 
-                formatted_tools = [
-                    {
-                        "name": f"{self.env_name}/{tool.name}",
-                        "description": tool.description,
-                        "inputSchema": tool.inputSchema,
-                    }
-                    for tool in tools
-                ]
+            formatted_tools = [
+                {
+                    "name": f"{self.env_name}/{tool.name}",
+                    "description": tool.description,
+                    "inputSchema": tool.inputSchema,
+                }
+                for tool in tools
+            ]
 
-                return formatted_tools
+            return formatted_tools
         except Exception as e:
             logger.error(
                 f"{self._log_prefix()} Failed to list tools for {self.env_name}: {str(e)} | "
@@ -459,6 +462,7 @@ async def _call_function(
         method: str = "POST",
         timeout: Optional[float] = None,
         ensure_initialized: bool = True,
+        quiet: bool = False,
     ) -> Dict[str, Any]:
         """
         Execute a registered function via HTTP endpoint.
@@ -467,6 +471,7 @@ async def _call_function(
             function_url: url of the registered function
             arguments: Arguments to pass to the function
             timeout: Override default timeout
+            quiet: If True, log at debug level instead of error on transient issues
 
         Returns:
             Function execution result
@@ -538,28 +543,30 @@ async def _call_function(
             if server_error:
                 error_msg = f"{error_msg} | Server error: {server_error}"
 
-            logger.error(
-                f"{self._log_prefix()} Function '{function_url}' execution http request failed: {error_msg} | "
+            _log = logger.debug if quiet else logger.error
+            _log(
+                f"{self._log_prefix()} Function '{function_url}' execution http request not ready: {error_msg} | "
                 f"Type: {type(e).__name__} | "
                 f"Environment: {self.env_name} | "
                 f"Arguments: {arguments} | "
                 f"Timeout: {timeout or self.timeout}s | "
                 f"Function URL: {function_url}"
             )
             raise EnvironmentError(
-                f"Function '{function_url}' execution failed: {error_msg}"
+                f"Function '{function_url}' execution not ready: {error_msg}"
             )
         except Exception as e:
-            logger.error(
-                f"{self._log_prefix()} Function '{function_url}' execution failed: {str(e)} | "
+            _log = logger.debug if quiet else logger.error
+            _log(
+                f"{self._log_prefix()} Function '{function_url}' execution encountered an issue: {str(e)} | "
                 f"Type: {type(e).__name__} | "
                 f"Environment: {self.env_name} | "
                 f"Arguments: {arguments} | "
                 f"Timeout: {timeout or self.timeout}s | "
                 f"Function URL: {function_url}"
             )
             raise EnvironmentError(
-                f"Function '{function_url}' execution failed: {str(e)}"
+                f"Function '{function_url}' execution encountered an issue: {str(e)}"
             )
 
     async def check_health(
@@ -639,40 +646,41 @@ async def call_tool(
             actual_tool_name = tool_name
 
         logger.info(
-            f"{self._log_prefix()} Executing tool: {actual_tool_name} in environment {self.env_name}"
+            f"{self._log_prefix()} Executing tool: {actual_tool_name} in environment {self.env_name}, arguments={arguments}"
         )
 
         try:
-            client = await self._get_mcp_client()
-            async with client:
-                result = await client.call_tool_mcp(
-                    name=actual_tool_name, arguments=arguments, timeout=timeout
-                )
+            client = await self._ensure_mcp_session()
+            result = await client.call_tool_mcp(
+                name=actual_tool_name, arguments=arguments, timeout=timeout
+            )
 
-                # Convert FastMCP result to ToolResult
-                content = []
-                if result.content:
-                    for item in result.content:
-                        if hasattr(item, "text") and item.text:
-                            content.append({"type": "text", "text": item.text})
-                        elif hasattr(item, "type") and hasattr(item, "data"):
-                            content.append({"type": item.type, "data": item.data})
-                        else:
-                            content.append({"type": "text", "text": str(item)})
+            # Convert FastMCP result to ToolResult
+            content = []
+            if result.content:
+                for item in result.content:
+                    if hasattr(item, "text") and item.text:
+                        content.append({"type": "text", "text": item.text})
+                    elif hasattr(item, "type") and hasattr(item, "data"):
+                        content.append({"type": item.type, "data": item.data})
+                    else:
+                        content.append({"type": "text", "text": str(item)})
 
-                return ToolResult(content=content, is_error=result.isError)
+            return ToolResult(content=content, is_error=result.isError)
 
         except Exception as e:
             logger.error(
-                f"{self._log_prefix()} Tool execution failed: {str(e)} | "
+                f"{self._log_prefix()} Tool execution encountered an issue: {str(e)} | "
                 f"Type: {type(e).__name__} | "
                 f"Environment: {self.env_name} | "
                 f"Tool: {actual_tool_name} | "
                 f"Arguments: {arguments} | "
                 f"Timeout: {timeout or self.timeout}s | "
                 f"MCP URL: {self.aenv_data_url}"
             )
-            raise ToolError(f"Tool '{actual_tool_name}' execution failed: {str(e)}")
+            raise ToolError(
+                f"Tool '{actual_tool_name}' execution encountered an issue: {str(e)}"
+            )
 
     async def get_env_info(self) -> Dict[str, Any]:
         """Get environment information."""
@@ -734,6 +742,7 @@ async def _wait_for_healthy(self, timeout: float = 300.0) -> None:
                         timeout=3.0,
                         method="GET",
                         ensure_initialized=False,
+                        quiet=True,
                     )
 
                     logger.debug(
@@ -751,7 +760,7 @@ async def _wait_for_healthy(self, timeout: float = 300.0) -> None:
 
                 except Exception as e:
                     logger.debug(
-                        f"{self._log_prefix()} Health check failed: {str(e)}, retrying..."
+                        f"{self._log_prefix()} Health check attempt {times + 1}: {str(e)}, retrying..."
                     )
 
                 if asyncio.get_event_loop().time() - start_time > timeout:
@@ -829,6 +838,7 @@ async def _create_env_instance(self):
                 arguments=self.arguments,
                 ttl=self.ttl,
                 owner=self.owner,
+                labels=self.labels,
             )
             logger.info(
                 f"{self._log_prefix()} Environment instance created with ID: {self._instance.id}"
@@ -908,3 +918,60 @@ async def _get_mcp_client(self) -> Client:
                 f"Timeout: {self.timeout}s "
             )
             raise EnvironmentError(f"Failed to create MCP client: {str(e)}")
+
+    async def _ensure_mcp_session(self) -> Client:
+        """
+        Ensure MCP client exists and its session is active.
+
+        Lazily creates the Client and enters its async context (establishing
+        the MCP session) on first call. Subsequent calls return the same
+        connected client. The session is only torn down in release().
+
+        Returns:
+            Connected Client with an active MCP session.
+        """
+        # Fast path: session already active and connected
+        if self._mcp_session_active and self._mcp_client is not None:
+            if self._mcp_client.is_connected():
+                return self._mcp_client
+            # Session died unexpectedly; will reconnect below
+            logger.warning(f"{self._log_prefix()} MCP session lost, reconnecting...")
+            self._mcp_session_active = False
+
+        # Lazy-init the lock
+        if not hasattr(self, "_mcp_session_lock"):
+            self._mcp_session_lock = asyncio.Lock()
+
+        async with self._mcp_session_lock:
+            # Double-check after acquiring lock
+            if self._mcp_session_active and self._mcp_client is not None:
+                if self._mcp_client.is_connected():
+                    return self._mcp_client
+                self._mcp_session_active = False
+
+            # Close stale client if any
+            if self._mcp_client is not None:
+                try:
+                    await self._mcp_client.close()
+                except Exception as e:
+                    logger.debug(
+                        f"{self._log_prefix()} Error closing stale MCP client: {e}"
+                    )
+                self._mcp_client = None
+
+            # Create fresh client and establish session
+            client = await self._get_mcp_client()
+            try:
+                await client.__aenter__()
+                self._mcp_session_active = True
+                logger.info(
+                    f"{self._log_prefix()} MCP session established and will be reused"
+                )
+                return client
+            except Exception as e:
+                self._mcp_client = None
+                self._mcp_session_active = False
+                logger.error(
+                    f"{self._log_prefix()} Failed to establish MCP session: {e}"
+                )
+                raise EnvironmentError(f"Failed to establish MCP session: {e}") from e