Support authoring ADK agents using processors.

kibergus · kibergus · commit 9a5e34d54641 · 2025-10-20T16:45:58.000+01:00
PiperOrigin-RevId: 816684684
diff --git a/examples/live/commentator_adk/agent.py b/examples/live/commentator_adk/agent.py
@@ -0,0 +1,52 @@
+# Copyright 2025 DeepMind Technologies Limited. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+r"""Live commentator ADK agent based on GenAI Processors.
+
+## Setup
+
+To install the dependencies for this script, run:
+
+```
+pip install genai-processors google-adk
+```
+
+Before running this script, ensure the `GOOGLE_API_KEY` environment
+variable is set to the api-key you obtained from Google AI Studio.
+
+## Run
+
+Change directory to the parent folder (genai-processors/examples/live) and run
+`adk web`. Then navigate to http://localhost:8000/, select "commentator_adk"
+agent and click on the "Use camera" button.
+
+To restart a session click on the "New session" button and reload the page.
+"""
+
+import os
+
+from genai_processors.core import adk
+import commentator
+
+
+# The API key is taken from the environment when this module is imported:
+#   export GOOGLE_API_KEY=...
+API_KEY = os.environ['GOOGLE_API_KEY']
+
+
+root_agent = adk.ProcessorAgent(
+    processor_factory=lambda: commentator.create_live_commentator(API_KEY),
+    name='commentator_adk',
+)
diff --git a/examples/trip_request_adk/agent.py b/examples/trip_request_adk/agent.py
@@ -0,0 +1,175 @@
+# Copyright 2025 DeepMind Technologies Limited. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+r"""ADK agent version of the trip request planner.
+
+We use Gemini flash-lite to formalize freeform trip request into the dates and
+destination. Then we use a second model to compose the trip itinerary.
+
+This simple example shows how we can reduce perceived latency by running a fast
+model to validate and acknowledge user request while the good but slow model is
+handling it.
+
+The approach from this example also can be used as a defense mechanism against
+prompt injections. The first model without tool access formalizes the request
+into the TripRequest dataclass. The attack surface is significantly reduced by
+the narrowness of the output format and lack of tools. Then a second model is
+run on this cleaned-up input.
+
+## Setup
+
+To install the dependencies for this script, run:
+
+```
+pip install genai-processors google-adk
+```
+
+Before running this script, ensure the `GOOGLE_API_KEY` environment
+variable is set to the api-key you obtained from Google AI Studio.
+
+## Run
+
+Change directory to `genai-processors/examples` and run `adk web`.
+Then navigate to http://localhost:8000/, select the "trip_request_adk"
+agent and enter your trip request.
+"""
+
+from collections.abc import AsyncIterable
+import datetime
+import os
+
+import dataclasses_json
+from genai_processors import content_api
+from genai_processors import processor
+from genai_processors import switch
+from genai_processors.core import adk
+from genai_processors.core import genai_model
+from genai_processors.core import preamble
+from google.genai import types as genai_types
+from pydantic import dataclasses
+
+# The API key is read from the environment: export GOOGLE_API_KEY=...
+API_KEY = os.environ['GOOGLE_API_KEY']
+
+
+@dataclasses_json.dataclass_json
+@dataclasses.dataclass(frozen=True)
+class TripRequest:
+  """Structured trip request, used as the JSON response schema of the model."""
+
+  start_date: str
+  end_date: str
+  destination: str
+  error: str  # A non-empty value is routed to the 'error' substream.
+
+  def info(self) -> str:
+    """Returns the dates and destination as a text block for use in prompts."""
+    return (
+        '\nTrip information:\n'
+        f'Start date: {self.start_date}\n'
+        f'End date: {self.end_date}\n'
+        f'Destination: {self.destination}\n'
+    )
+
+
+# Stateless processors are best written as plain functions; the decorator
+# below turns such a function into a part processor.
+@processor.part_processor_function
+async def process_json_output(
+    part: content_api.ProcessorPart,
+) -> AsyncIterable[content_api.ProcessorPart]:
+  """Turns the model's JSON part into trip info text or an error part."""
+  request = part.get_dataclass(TripRequest)
+  if not request.error:
+    yield content_api.ProcessorPart(request.info())
+    return
+  yield content_api.ProcessorPart(
+      request.error,
+      substream_name='error',
+  )
+
+
+def create_trip_request_processor() -> processor.Processor:
+  """Builds the trip planner: request extraction, then planning or error."""
+  # Stage 1: extract a json trip request from the user input. Parsing the
+  # model's json output needs a json dataclass (we use the pydantic wrapper).
+  # Today's date is added to the prompt so the model uses the current date.
+  today_suffix = preamble.Suffix(
+      content_factory=lambda: f'Today is: {datetime.date.today()}'
+  )
+  extract_trip_request = today_suffix + genai_model.GenaiModel(
+      api_key=API_KEY,
+      model_name='gemini-2.0-flash-lite',
+      generate_content_config=genai_types.GenerateContentConfig(
+          system_instruction=(
+              'You are a travel agent. You are given a trip request from a'
+              ' user. You need to check if the user provided all necessary'
+              ' information. If the user request is missing any'
+              ' information, you need to return an error message. If the'
+              ' user request is complete, you need to return the user'
+              ' request with the start date, end date and the destination.'
+          ),
+          response_schema=TripRequest,
+          response_mime_type='application/json',
+      ),
+  )
+  # Stage 2: generate a trip itinerary based on a valid trip request.
+  generate_trip = genai_model.GenaiModel(
+      api_key=API_KEY,
+      # NOTE: To keep the demo cheap to run we use the flash-lite model.
+      # A real application would use a better but slower thinking model.
+      # The perceived latency of that model would be hidden by the fast answer
+      # from extract_trip_request and by acknowledging to the user that we've
+      # started planning the trip.
+      model_name='gemini-2.0-flash-lite',
+      generate_content_config=genai_types.GenerateContentConfig(
+          system_instruction=(
+              'You are a travel agent. You are given a trip request from a user'
+              ' with dates and destination. Plan a trip with hotels and'
+              ' activities. Split the plan into daily section. Plan one'
+              ' activity per 1/2 day max.'
+          ),
+          # Ground with Google Search
+          tools=[genai_types.Tool(google_search=genai_types.GoogleSearch())],
+      ),
+  )
+
+  # Preamble that acknowledges the request to the user; it is run alongside
+  # the itinerary generation below.
+  msg_to_user = preamble.Preamble(
+      content='OK, preparing a trip for the following request:\n',
+  )
+
+  # Plumb everything together with a logical switch that lets us handle errors.
+  # Valid requests arrive on the default (empty) substream. They are handled
+  # by `parallel_concat`, which runs its processors concurrently and
+  # concatenates their results.
+  plan_trip = processor.parallel_concat([msg_to_user, generate_trip])
+  # Parts on any other substream, i.e. errors, fall through to the default
+  # processor, which returns them unchanged.
+  route_by_substream = (
+      switch.Switch(content_api.get_substream_name)
+      .case('', plan_trip)
+      .default(processor.passthrough())
+  )
+
+  # Full chain: extract the request, parse it, then plan or report the error.
+  return extract_trip_request + process_json_output + route_by_substream
+
+
+root_agent = adk.ProcessorAgent(
+    processor_factory=create_trip_request_processor,
+    name='trip_request_adk',
+)
diff --git a/genai_processors/core/adk.py b/genai_processors/core/adk.py
@@ -0,0 +1,174 @@
+# Copyright 2025 DeepMind Technologies Limited. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""ADK - GenAI Processors integration."""
+
+from typing import AsyncGenerator, AsyncIterable, Callable, override
+
+from genai_processors import content_api
+from genai_processors import processor
+from google.adk.agents import base_agent
+from google.adk.agents import invocation_context
+from google.adk.events import event as adk_event
+from google.adk.events import event_actions
+from google.genai import types as genai_types
+
+
+class ProcessorAgent(base_agent.BaseAgent):
+  """ADK Custom agent that delegates processing its input to a Processor.
+
+  Works both for turn-based and live modes. In case of turn-based mode the
+  Processor will be called for each user turn with the whole conversation
+  history up to that turn.
+
+  This agent uses ADK token streaming. The "Token streaming" checkbox in the
+  ADK UI must be enabled for the response to be rendered correctly. If used
+  programmatically, the consumer must use either only the events marked as
+  partial=True or only the ones marked as turn_complete=True, but not both.
+  """
+
+  def __init__(
+      self, processor_factory: Callable[[], processor.Processor], *, name: str
+  ):
+    """Initializes the ProcessorAgent.
+
+    Args:
+      processor_factory: A function that returns a Processor to be applied to
+        the incoming content. It will be called on each turn and each request.
+        Unless the returned processor is stateless, it must return a new
+        instance every time to avoid state sharing between users.
+      name: The agent's name. It must be a valid Python identifier and unique
+        within the agent tree. It can't be "user", since it's reserved for
+        end-user's input.
+    """
+    super().__init__(name=name)
+    self._processor_factory = processor_factory
+
+  def _history_key(self) -> str:
+    """Returns the session state key under which the history is stored."""
+    return f'history_{self.name}'
+
+  def _append_to_history(
+      self,
+      ctx: invocation_context.InvocationContext,
+      content: genai_types.Content,
+  ) -> adk_event.Event:
+    """Returns an event whose state delta extends the history by `content`.
+
+    Parsing conversation history from the Event log requires handling many
+    edge cases which ADK considers to be implementation details. Currently
+    only adk.LlmAgent is privileged to do that. As a temporary workaround we
+    accumulate the history in the session state. Downside is that the event
+    log (stored in memory) will grow as n^2.
+
+    Args:
+      ctx: Invocation context whose session state holds the history so far.
+      content: The conversation turn to add.
+
+    Returns:
+      An event authored by this agent. The session state itself is not
+      modified here; the new history only travels in the event's state delta.
+    """
+    key = self._history_key()
+    # Build a new list instead of appending in place: the stored list may be
+    # the very object referenced by the state delta of an earlier event, and
+    # mutating it would silently rewrite that event.
+    history = [*ctx.session.state.get(key, []), content]
+    return adk_event.Event(
+        actions=event_actions.EventActions(state_delta={key: history}),
+        author=self.name,
+    )
+
+  async def _stream_history(
+      self, ctx: invocation_context.InvocationContext
+  ) -> AsyncIterable[content_api.ProcessorPart]:
+    """Yields the recorded history part by part, oldest turn first.
+
+    Each part carries the role of the turn it belongs to. Nothing is yielded
+    when no history has been recorded for this agent yet.
+    """
+    for content in ctx.session.state.get(self._history_key(), []):
+      # `parts` may be unset on a turn; treat that as a turn without parts.
+      for part in content.parts or []:
+        yield content_api.ProcessorPart(part, role=content.role)
+
+  @override
+  async def _run_async_impl(
+      self, ctx: invocation_context.InvocationContext
+  ) -> AsyncGenerator[adk_event.Event, None]:
+    """Runs the processor over the whole history for one user turn.
+
+    Yields:
+      A content-less event recording the user turn (when there is one), then
+      one `partial=True` event per part produced by the processor, and finally
+      a `turn_complete=True` event that carries the complete response and
+      records it in the history.
+    """
+    p = self._processor_factory()
+
+    # Without user content there is no new turn to record; the processor still
+    # runs on whatever history exists.
+    if ctx.user_content is not None:
+      yield self._append_to_history(ctx, ctx.user_content)
+    response = genai_types.Content(parts=[], role='model')
+    async for part in p(self._stream_history(ctx)):
+      yield adk_event.Event(
+          content=genai_types.Content(parts=[part.part], role='model'),
+          author=self.name,
+          partial=True,
+          invocation_id=ctx.invocation_id,
+      )
+      response.parts.append(part.part)
+
+    final_event = self._append_to_history(ctx, response)
+    final_event.content = response
+    final_event.turn_complete = True
+    yield final_event
+
+  @override
+  async def _run_live_impl(
+      self, ctx: invocation_context.InvocationContext
+  ) -> AsyncGenerator[adk_event.Event, None]:
+    """Streams live input through the processor, one event per output part.
+
+    Only the `blob` payload of live requests is forwarded to the processor, as
+    user parts on the 'realtime' substream.
+    """
+
+    async def stream_content():
+      while True:
+        request = await ctx.live_request_queue.get()
+        if request.blob:
+          yield content_api.ProcessorPart(
+              request.blob.data,
+              mimetype=request.blob.mime_type,
+              substream_name='realtime',
+              role='user',
+          )
+        if request.close:
+          # NOTE: Currently ADK Web doesn't close connection and this case is
+          # unreachable. _run_live_impl handlers will leak. Fixing this is in
+          # ADK backlog.
+          break
+
+    p = self._processor_factory()
+    async for part in p(stream_content()):
+      yield adk_event.Event(
+          # Parts without a role are attributed to the model. The role must be
+          # set on the Content, since only `part.part` goes into the event.
+          content=genai_types.Content(
+              parts=[part.part], role=part.role or 'model'
+          ),
+          author=self.name,
+      )
diff --git a/genai_processors/tests/adk_test.py b/genai_processors/tests/adk_test.py