Merged
30 commits
9cd388d
xDS: ext_proc: add GRPC processing mode, and clean up docs
markdroth Mar 13, 2025
c30e220
Merge remote-tracking branch 'upstream/main' into ext_proc_grpc
markdroth Jul 10, 2025
ed81c37
add missing import
markdroth Jul 11, 2025
b30a64b
add missing build dep
markdroth Jul 11, 2025
2800967
spelling
markdroth Jul 11, 2025
42bd600
fix formatting
markdroth Jul 11, 2025
532f526
attempt to fix doc generation
markdroth Jul 11, 2025
5166f35
Merge remote-tracking branch 'upstream/main' into ext_proc_grpc
markdroth Sep 10, 2025
ace4e47
attempt to fix RST formatting
markdroth Sep 10, 2025
8c307bc
fix wording
markdroth Sep 10, 2025
bc9a0ad
clarify streaming behavior of GRPC body send mode
markdroth Sep 12, 2025
975e849
add comment about timeout behavior vs. body mode, and send_body_witho…
markdroth Sep 12, 2025
e8afc4b
try to fix formatting
markdroth Sep 12, 2025
532c31d
GRPC mode will support timers, and note that FULL_DUPLEX_STREAMED doe…
markdroth Sep 12, 2025
cd3b71f
[xDS] improve documentation for ext_proc
markdroth Sep 12, 2025
4b7f6f5
clarify wording
markdroth Sep 12, 2025
e7cbd4d
formatting and wording tweak
markdroth Sep 12, 2025
aa8d3cc
GRPC mode uses StreamedBodyResponse
markdroth Sep 12, 2025
6932eb6
clarify GRPC mode description, and note that message timeouts are not…
markdroth Sep 12, 2025
0015fbd
ext_proc server can inject EOS on gRPC client message
markdroth Sep 12, 2025
708120f
add a safe way for ext_proc server to close the stream with OK status
markdroth Sep 12, 2025
8b95c52
Update api/envoy/extensions/filters/http/ext_proc/v3/processing_mode.…
markdroth Sep 16, 2025
9186b12
clarify wording
markdroth Sep 16, 2025
51224c4
Merge branch 'ext_proc_doc_update' into ext_proc_grpc
markdroth Sep 16, 2025
d2334a8
add end_of_stream_without_message field
markdroth Sep 16, 2025
ced8f28
add end_of_stream_without_message in response also
markdroth Sep 16, 2025
28c5bd6
Merge remote-tracking branch 'upstream/main' into ext_proc_grpc
markdroth Sep 18, 2025
af6aa49
note that GRPC mode is similar to FULL_DUPLEX_STREAMED
markdroth Oct 2, 2025
ec538a3
fix space
markdroth Oct 2, 2025
4fa776a
add a bit to indicate whether gRPC messages are compressed
markdroth Oct 7, 2025
1 change: 1 addition & 0 deletions api/envoy/extensions/filters/http/ext_proc/v3/BUILD
@@ -6,6 +6,7 @@ licenses(["notice"]) # Apache 2

api_proto_package(
deps = [
"//envoy/annotations:pkg",
"//envoy/config/common/mutation_rules/v3:pkg",
"//envoy/config/core/v3:pkg",
"//envoy/type/matcher/v3:pkg",
79 changes: 43 additions & 36 deletions api/envoy/extensions/filters/http/ext_proc/v3/ext_proc.proto
@@ -16,6 +16,7 @@ import "google/protobuf/wrappers.proto";

import "xds/annotations/v3/status.proto";

import "envoy/annotations/deprecation.proto";
import "udpa/annotations/migrate.proto";
import "udpa/annotations/status.proto";
import "validate/validate.proto";
@@ -48,18 +49,24 @@ option (udpa.annotations.file_status).package_version_status = ACTIVE;
//
// * Whether it receives the response message at all.
// * Whether it receives the message body at all, in separate chunks, or as a single buffer.
// * Whether subsequent HTTP requests are transmitted synchronously or whether they are
// sent asynchronously.
// * To modify request or response trailers if they already exist.
//
// The filter supports up to six different processing steps. Each is represented by
// a gRPC stream message that is sent to the external processor. For each message, the
// processor must send a matching response.
//
// * Request headers: Contains the headers from the original HTTP request.
// * Request body: Delivered if they are present and sent in a single message if
// the ``BUFFERED`` or ``BUFFERED_PARTIAL`` mode is chosen, in multiple messages if the
// ``STREAMED`` mode is chosen, and not at all otherwise.
// * Request body: If the body is present, the behavior depends on the
// body send mode:
// * ``BUFFERED`` or ``BUFFERED_PARTIAL``: Entire body is sent to the
// external processor in a single message.
// * ``STREAMED`` or ``FULL_DUPLEX_STREAMED``: Body will be split across
// multiple messages sent to the external processor.
// * ``GRPC``: As each gRPC message arrives, it will be sent to the external
// processor. There will be exactly one gRPC message in each message
// sent to the external processor.
// * ``NONE``: Body will not be sent to the external processor.
//
// * Request trailers: Delivered if they are present and if the trailer mode is set
// to ``SEND``.
// * Response headers: Contains the headers from the HTTP response. Keep in mind
@@ -75,7 +82,7 @@ option (udpa.annotations.file_status).package_version_status = ACTIVE;
// from the external processor. The latter is only enabled if ``allow_mode_override`` is
// set to true. This way, a processor may, for example, use information
// in the request header to determine whether the message body must be examined, or whether
// the proxy should simply stream it straight through.
// the data plane should simply stream it straight through.
//
// All of this together allows a server to process the filter traffic in fairly
// sophisticated ways. For example:
@@ -84,12 +91,8 @@ option (udpa.annotations.file_status).package_version_status = ACTIVE;
// on the content of the headers.
// * A server may choose to immediately reject some messages based on their HTTP
// headers (or other dynamic metadata) and more carefully examine others.
// * A server may asynchronously monitor traffic coming through the filter by inspecting
// headers, bodies, or both, and then decide to switch to a synchronous processing
// mode, either permanently or temporarily.
//
// The protocol itself is based on a bidirectional gRPC stream. Envoy will send the
// server
// The protocol itself is based on a bidirectional gRPC stream. The data plane will send the server
// :ref:`ProcessingRequest <envoy_v3_api_msg_service.ext_proc.v3.ProcessingRequest>`
// messages, and the server must reply with
// :ref:`ProcessingResponse <envoy_v3_api_msg_service.ext_proc.v3.ProcessingResponse>`.
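For orientation, a minimal filter configuration exercising these knobs might look like the sketch below. This is not part of the PR; the cluster name and all values are illustrative assumptions.

```yaml
# Hypothetical ext_proc filter config; cluster name and values are illustrative.
http_filters:
- name: envoy.filters.http.ext_proc
  typed_config:
    "@type": type.googleapis.com/envoy.extensions.filters.http.ext_proc.v3.ExternalProcessor
    grpc_service:
      envoy_grpc:
        cluster_name: ext_proc_cluster  # assumed cluster for the processor
    processing_mode:
      request_header_mode: SEND
      response_header_mode: SEND
      request_body_mode: STREAMED
    message_timeout: 0.2s  # matches the documented 200ms default
```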
@@ -124,7 +127,6 @@ message ExternalProcessor {
reserved "async_mode";

// Configuration for the gRPC service that the filter will communicate with.
// The filter supports both the "Envoy" and "Google" gRPC clients.
// Only one of ``grpc_service`` or ``http_service`` can be set.
// It is required that one of them must be set.
config.core.v3.GrpcService grpc_service = 1
@@ -140,14 +142,14 @@ message ExternalProcessor {
// cannot be configured to send any body or trailers. i.e., ``http_service`` only supports
// sending request or response headers to the side stream server.
//
// With this configuration, Envoy behavior:
// With this configuration, the data plane behavior is:
//
// 1. The headers are first put in a proto message
// :ref:`ProcessingRequest <envoy_v3_api_msg_service.ext_proc.v3.ProcessingRequest>`.
//
// 2. This proto message is then transcoded into a JSON text.
//
// 3. Envoy then sends an HTTP POST message with content-type as "application/json",
// 3. The data plane then sends an HTTP POST message with content-type as "application/json",
// and this JSON text as body to the side stream server.
//
// After the side-stream receives this HTTP request message, it is expected to do as follows:
@@ -160,7 +162,7 @@ message ExternalProcessor {
//
// 3. It converts the ``ProcessingResponse`` proto message into a JSON text.
//
// 4. It then sends an HTTP response back to Envoy with status code as ``"200"``,
// 4. It then sends an HTTP response back to the data plane with status code as ``"200"``,
// ``content-type`` as ``"application/json"`` and sets the JSON text as the body.
//
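To make the four server-side steps concrete, here is a small sketch (not part of the PR) of what the side-stream server's handler could do. The proto-JSON field names and the header-mutation shape are illustrative assumptions, not the normative schema:

```python
import json

def handle_ext_proc_post(body: bytes) -> tuple[int, dict, bytes]:
    """Sketch of one side-stream exchange: parse the transcoded
    ProcessingRequest JSON, build a ProcessingResponse, reply as JSON."""
    processing_request = json.loads(body)  # steps 1-2: examine the request

    # Step 3: build an illustrative ProcessingResponse-shaped dict.
    # (Field names here are assumptions based on the proto JSON mapping.)
    processing_response = {
        "requestHeaders": {
            "response": {
                "headerMutation": {
                    "setHeaders": [
                        {"header": {"key": "x-ext-proc-seen", "rawValue": "dHJ1ZQ=="}}
                    ]
                }
            }
        }
    }

    # Step 4: HTTP 200 with content-type application/json and the JSON body.
    return 200, {"content-type": "application/json"}, json.dumps(processing_response).encode()
```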
ExtProcHttpService http_service = 20 [
@@ -194,28 +196,30 @@ message ExternalProcessor {
// sent. See ``ProcessingMode`` for details.
ProcessingMode processing_mode = 3;

// Envoy provides a number of :ref:`attributes <arch_overview_attributes>`
// The data plane provides a number of :ref:`attributes <arch_overview_attributes>`
// for expressive policies. Each attribute name provided in this field will be
// matched against that list and populated in the ``request_headers`` message.
// matched against that list and populated in the
// :ref:`ProcessingRequest.attributes <envoy_v3_api_field_service.ext_proc.v3.ProcessingRequest.attributes>` field.
// See the :ref:`attribute documentation <arch_overview_request_attributes>`
// for the list of supported attributes and their types.
repeated string request_attributes = 5;

// Envoy provides a number of :ref:`attributes <arch_overview_attributes>`
// The data plane provides a number of :ref:`attributes <arch_overview_attributes>`
// for expressive policies. Each attribute name provided in this field will be
// matched against that list and populated in the ``response_headers`` message.
// matched against that list and populated in the
// :ref:`ProcessingRequest.attributes <envoy_v3_api_field_service.ext_proc.v3.ProcessingRequest.attributes>` field.
// See the :ref:`attribute documentation <arch_overview_attributes>`
// for the list of supported attributes and their types.
repeated string response_attributes = 6;

// Specifies the timeout for each individual message sent on the stream and
// when the filter is running in synchronous mode. Whenever the proxy sends
// a message on the stream that requires a response, it will reset this timer,
// and will stop processing and return an error (subject to the processing mode)
// if the timer expires before a matching response is received. There is no
// timeout when the filter is running in asynchronous mode. Zero is a valid
// config which means the timer will be triggered immediately. If not
// configured, default is 200 milliseconds.
// Specifies the timeout for each individual message sent on the stream.
// Whenever the data plane sends a message on the stream that requires a
// response, it will reset this timer, and will stop processing and return
// an error (subject to the processing mode) if the timer expires before a
// matching response is received. There is no timeout when the filter is
// running in observability mode. Zero is a valid config which means the
// timer will be triggered immediately. If not configured, default is 200
// milliseconds.
google.protobuf.Duration message_timeout = 7 [(validate.rules).duration = {
lte {seconds: 3600}
gte {}
@@ -232,7 +236,7 @@ message ExternalProcessor {
// :ref:`header_prefix <envoy_v3_api_field_config.bootstrap.v3.Bootstrap.header_prefix>`
// (which is usually "x-envoy").
// Note that changing headers such as "host" or ":authority" may not in itself
// change Envoy's routing decision, as routes can be cached. To also force the
// change the data plane's routing decision, as routes can be cached. To also force the
// route to be recomputed, set the
// :ref:`clear_route_cache <envoy_v3_api_field_service.ext_proc.v3.CommonResponse.clear_route_cache>`
// field to true in the same response.
@@ -274,10 +278,11 @@ message ExternalProcessor {

// If true, send each part of the HTTP request or response specified by ``ProcessingMode``
// without pausing on filter chain iteration. It is "Send and Go" mode that can be used
// by external processor to observe Envoy data and status. In this mode:
// by external processor to observe the request's data and status. In this mode:
//
// 1. Only ``STREAMED`` body processing mode is supported and any other body processing modes will be
// ignored. ``NONE`` mode (i.e., skip body processing) will still work as expected.
// 1. Only ``STREAMED`` and ``GRPC`` body processing modes are supported and any other body
// processing modes will be ignored. ``NONE`` mode (i.e., skip body processing) will still
// work as expected.
//
// 2. External processor should not send back processing response, as any responses will be ignored.
// This also means that
@@ -314,12 +319,13 @@ message ExternalProcessor {
// Specifies the deferred closure timeout for gRPC stream that connects to external processor. Currently, the deferred stream closure
// is only used in :ref:`observability_mode <envoy_v3_api_field_extensions.filters.http.ext_proc.v3.ExternalProcessor.observability_mode>`.
// In observability mode, gRPC streams may be held open to the external processor longer than the lifetime of the regular client to
// backend stream lifetime. In this case, Envoy will eventually timeout the external processor stream according to this time limit.
// backend stream lifetime. In this case, the data plane will eventually timeout the external processor stream according to this time limit.
// The default value is 5000 milliseconds (5 seconds) if not specified.
google.protobuf.Duration deferred_close_timeout = 19;

// Send body to the side stream server once it arrives without waiting for the header response from that server.
// It only works for ``STREAMED`` body processing mode. For any other body processing modes, it is ignored.
// It only works for ``STREAMED`` and ``GRPC`` body processing modes. For any other body
// processing modes, it is ignored.
// The server has two options upon receiving a header request:
//
// 1. Instant Response: send the header response as soon as the header request is received.
@@ -328,9 +334,9 @@
//
// In all scenarios, the header-body ordering must always be maintained.
//
// If enabled Envoy will ignore the
// If enabled the data plane will ignore the
// :ref:`mode_override <envoy_v3_api_field_service.ext_proc.v3.ProcessingResponse.mode_override>`
// value that the server sends in the header response. This is because Envoy may have already
// value that the server sends in the header response. This is because the data plane may have already
// sent the body to the server, prior to processing the header response.
bool send_body_without_waiting_for_header_response = 21;

@@ -434,7 +440,8 @@ message ExtProcOverrides {

// [#not-implemented-hide:]
// Set a different asynchronous processing option than the default.
bool async_mode = 2;
// Deprecated and not implemented.
bool async_mode = 2 [deprecated = true, (envoy.annotations.deprecated_at_minor_version) = "3.0"];

// [#not-implemented-hide:]
// Set different optional attributes than the default setting of the
api/envoy/extensions/filters/http/ext_proc/v3/processing_mode.proto
@@ -65,8 +65,7 @@ message ProcessingMode {
// Do not send the body at all. This is the default.
NONE = 0;

// Stream the body to the server in pieces as they arrive at the
// proxy.
// Stream the body to the server in pieces as they are seen.
STREAMED = 1;

// Buffer the message body in memory and send the entire body at once.
@@ -79,11 +78,11 @@
// up to the buffer limit will be sent.
BUFFERED_PARTIAL = 3;

// Envoy streams the body to the server in pieces as they arrive.
// The ext_proc client streams the body to the server in pieces as they arrive.
//
// 1) The server may choose to buffer any number of chunks of data before processing them.
// After it finishes buffering, the server processes the buffered data. Then it splits the processed
// data into any number of chunks, and streams them back to Envoy one by one.
// data into any number of chunks, and streams them back to the client one by one.
// The server may continuously do so until the complete body is processed.
// The individual response chunk size is recommended to be no greater than 64K bytes, or
// :ref:`max_receive_message_length <envoy_v3_api_field_config.core.v3.GrpcService.EnvoyGrpc.max_receive_message_length>`
@@ -98,17 +97,29 @@
//
// In this body mode:
// * The corresponding trailer mode has to be set to ``SEND``.
// * Envoy will send body and trailers (if present) to the server as they arrive.
// * The client will send body and trailers (if present) to the server as they arrive.
// Sending the trailers (if present) informs the server that the complete body has arrived.
// In case there are no trailers, then Envoy will set
// In case there are no trailers, then the client will set
// :ref:`end_of_stream <envoy_v3_api_field_service.ext_proc.v3.HttpBody.end_of_stream>`
// to true as part of the last body chunk request to notify the server that no other data is to be sent.
// * The server needs to send
// :ref:`StreamedBodyResponse <envoy_v3_api_msg_service.ext_proc.v3.StreamedBodyResponse>`
// to Envoy in the body response.
// * Envoy will stream the body chunks in the responses from the server to the upstream/downstream as they arrive.
// to the client in the body response.
// * The client will stream the body chunks in the responses from the server to the upstream/downstream as they arrive.

FULL_DUPLEX_STREAMED = 4;

// [#not-implemented-hide:]
// gRPC traffic. In this mode, the ext_proc client will de-frame the
// individual gRPC messages inside the HTTP/2 DATA frames, and as each
// message is de-framed, it will be sent to the ext_proc server as a
// :ref:`request_body
// <envoy_v3_api_field_service.ext_proc.v3.ProcessingRequest.request_body>`
// or :ref:`response_body
// <envoy_v3_api_field_service.ext_proc.v3.ProcessingRequest.response_body>`.
// If the ext_proc server modifies the body, that modified body will
// be used to replace the gRPC message in the stream.
GRPC = 5;
Contributor

This protocol mode does not seem to define a new behavior but rather a semantic interpretation of content of the body bytes. An ext_proc client that sends a body containing a complete gRPC message using the GRPC mode and any other mode is indistinguishable to the ext_proc server - i.e. they will all be processed the same way.

In the end I think this change complicates the already complicated and confusing protocol even more without offering a tangible benefit. Moreover, server implementations still have to support gRPC messages split over multiple ext_proc messages, since this is an existing behavior.

Contributor Author (@markdroth, Sep 23, 2025)

This protocol mode does not seem to define a new behavior but rather a semantic interpretation of content of the body bytes. An ext_proc client that sends a body containing a complete gRPC message using the GRPC mode and any other mode is indistinguishable to the ext_proc server - i.e. they will all be processed the same way.

That's not actually true -- the contents sent to the ext_proc server are actually different under this mode, so the ext_proc server can absolutely tell the difference.

For gRPC traffic, the content of the HTTP/2 DATA frames is a sequence of framed gRPC messages. However, there is no guarantee that each DATA frame contains exactly one framed gRPC message; it's entirely possible to have a single framed gRPC message span multiple DATA frames, and it's also entirely possible to have multiple framed gRPC messages within a single DATA frame. The goal of the new GRPC body send mode is to handle the buffering and deframing in the data plane instead of making every ext_proc server handle it itself.

In an existing body send mode like FULL_DUPLEX_STREAMED, every ext_proc server will need to handle buffering and deframing of gRPC messages as it receives DATA frame chunks. In the new GRPC mode, the ext_proc server sees only the deframed gRPC messages, and it always gets exactly one deframed gRPC message in each body message on the ext_proc stream.
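The framing being described is gRPC's length-prefixed message format: each message on the wire is a 1-byte compressed flag, a 4-byte big-endian length, then the payload. The sketch below (not from the PR) shows why DATA-frame-sized chunks need not align with message boundaries, and the incremental buffering and deframing work that GRPC mode would move into the data plane:

```python
import struct

def frame(msg: bytes, compressed: bool = False) -> bytes:
    """gRPC length-prefixed framing: 1-byte flag + 4-byte big-endian length."""
    return struct.pack(">BI", 1 if compressed else 0, len(msg)) + msg

class GrpcDeframer:
    """Recovers whole gRPC messages from arbitrarily split byte chunks."""

    def __init__(self) -> None:
        self._buf = b""

    def push(self, chunk: bytes) -> list[tuple[bool, bytes]]:
        """Feed one chunk (e.g. one DATA frame's worth); return completed messages."""
        self._buf += chunk
        messages = []
        while len(self._buf) >= 5:
            flag, length = struct.unpack(">BI", self._buf[:5])
            if len(self._buf) < 5 + length:
                break  # message incomplete: keep buffering
            messages.append((bool(flag), self._buf[5:5 + length]))
            self._buf = self._buf[5 + length:]
        return messages

# Two framed messages, split at boundaries unrelated to the framing:
deframer = GrpcDeframer()
wire = frame(b"hello") + frame(b"world!", compressed=True)
out = deframer.push(wire[:3]) + deframer.push(wire[3:14]) + deframer.push(wire[14:])
# out == [(False, b"hello"), (True, b"world!")]
```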

In addition, note that gRPC cannot implement any other mode here, because our filters do not have access to the raw HTTP/2 DATA frames. In gRPC, we handle deframing the gRPC messages in our transport layer (i.e., the same place where we handle the HTTP/2 protocol), and our filters see only the deframed gRPC messages. The only way we could implement the current FULL_DUPLEX_STREAMED protocol would be some horrible hack where we'd need to re-add the HTTP/2 framing to each message before we send it to the ext_proc server, which really doesn't make sense -- and it would probably hurt performance by requiring additional memory allocations. And since we want to support the ability for users to switch between proxy-based setups and proxyless gRPC, we need some common protocol that both data planes can support for gRPC traffic.

So basically, there are two arguments for this new mode:

  1. We want to make things easier by having the gRPC buffering and framing handled in the data plane instead of in each individual ext_proc server.
  2. gRPC cannot support any other body send mode, and we want a common mode that works with both data planes for gRPC traffic.

server implementations still have to support gRPC messages split over multiple ext_proc messages since this is an existing behavior.

I think there's a clear path to removing the need for that in existing servers:

  1. Add support for GRPC mode in the ext_proc server. (Note that the ext_proc request already tells the server what body send mode the client is using, so during this migration, the server can tell how it's supposed to handle each ext_proc stream.)
  2. Change the configuration of all data planes to use GRPC mode.
  3. Once all data planes have been reconfigured, it will be safe to remove support for other body send modes from the ext_proc server.

Contributor

The BodySendMode describes the behavior of the state machine for exchanging body content with the server. You are describing two things simultaneously with this new value: what is contained in the body payload and (possibly) new state transitions. The latter part is not described here. Does this value imply that the state machine is the same as STREAMED but with a payload of gRPC messages? Or is it the same as FULL_DUPLEX_STREAMED? Or something new entirely? And why can't I use the BUFFERED state machine if I know I will only have unary gRPC messages?

Contributor Author

The state machine is essentially the same as FULL_DUPLEX_STREAMED, just with the addition of the buffering and deframing of gRPC messages. In other words, the data plane will buffer only until it sees a complete gRPC message, at which point it will deframe the message and stream it to the ext_proc server. And the body responses sent back from the ext_proc server will each be an individual gRPC message as well.

I don't think it makes sense to use BUFFERED mode here. Note that the gRPC wire protocol is designed to handle streaming as a first-class citizen, and unary RPCs are just a special case: a unary RPC is a bidi stream that just happens to have a single request followed by a single result. Inside the HTTP/2 DATA frames, the request and response messages are still encoded with the same gRPC framing as in streaming cases. So using BUFFERED mode would still require the data plane to send the raw contents of the HTTP/2 DATA frames, and it would require the ext_proc server to handle the deframing, which is what we're trying to avoid here. (I don't think we want to add a BUFFERED_GRPC mode to make it handle the framing, and even if we did, the behavior would wind up being the same as the GRPC mode proposed here, so I think that would add complexity without actually providing any benefit.)

Contributor

@markdroth can the gRPC client just re-use FULL_DUPLEX_STREAMED mode then? The gRPC client implementation can do the buffering and deframing before sending the message to the ext_proc server, as an implementation detail of the gRPC client.

Contributor Author

Based on the above comment, the proposal is that the only body send mode supported by proxyless gRPC is GRPC? If so, I take it that the expectation is that Envoy would not have to implement GRPC at all, right?

No, my expectation is that Envoy would also implement GRPC mode. Users that want to use ext_proc for gRPC traffic would want to migrate to this mode if they need to use proxyless gRPC.

I think it is a net loss to not have FULL_DUPLEX_STREAMED mode for proxyless gRPC. Part of the appeal of ext_proc is that extension authors can do things which aren't supported by the Envoy/proxyless gRPC stack and/or are too expensive or risky to do in either place. We recently had this discussion for compression and decompression, because the CPU cost of doing it in the proxy was a significant driver to moving it to ext_proc — at least then, it could be paid for by the ext_proc server owner rather than the proxy/client.

Take for example an ext_proc server which implements a new form of compression, let's call it Zsupreme. For cost reasons or whatever, the customer deploys an ext_proc server on GCE that sets the appropriate headers and performs Zsupreme compression on the body bytes for the proxy — AIUI, this is not possible using GRPC send mode.

If the goal is to implement compression on a per-message basis, which is the way compression is normally done for gRPC, then it should be totally possible in GRPC mode.

If the goal is to implement compression for the entire HTTP/2 stream, even compressing the gRPC framing within the HTTP/2 DATA frames, then that's not something gRPC will be able to support in the first place, regardless of how we structure the configuration. In gRPC, we deal with the gRPC framing in our transport layer, and the xDS HTTP filters are above that, so the ext_proc filter will see only the deframed gRPC messages. It's not possible for the filter to replace the raw HTTP/2 DATA frames, since it simply doesn't operate at that layer.

Given gRPC's architecture, I don't think there's actually anything that the ext_proc server could do that we could actually support that it won't be able to do with GRPC mode.

Contributor Author

BTW, I will note that this is yet another reason why it makes sense for gRPC to not support FULL_DUPLEX_STREAMED, because that may fool ext_proc server authors into thinking that they can do things that gRPC simply can't support.

Contributor

After thinking more and looking at other ext_proc implementations I think it would be preferable to use a separate field to indicate content and leave body sending mode as is. Proxyless gRPC would then use content_type: GRPC and ...body_mode: FULL_DUPLEX_STREAMED. Proxyless gRPC does need to implement other modes like BUFFERED or STREAMED.

The reason is we want to add support for other content types such as JSON-RPC and we want to be able to send them in all modes, most importantly in BUFFERED mode, since some ext_proc servers only support this mode and it will delay adoption if we have to force implementations to use FULL_DUPLEX_STREAMED to be able to process other content types.

If we put the GRPC content as the send mode then we have to add content-type for JSON-RPC anyway and then have to explain that it works in all cases except GRPC mode, which is not great.

Using content-type; GRPC and ..._body_mode: FULL_DUPLEX_STREAMED will work exactly the same way as GRPC body send mode without limiting implementation from using other send modes either for GRPC or for other protocols we are adding.

Contributor Author

I understand the desire to support other content-aware modes like JSON-RPC, and I agree that that should be possible. So let's talk about the best way to do that.

It's not clear to me that introducing a separate content type setting actually provides a better story for doing that, because it's not actually an independent dimension from the body send mode. The content type would actually directly affect the behavior of the body send mode -- e.g., the exact buffering behavior of FULL_DUPLEX_STREAMED will be different depending on whether the content type is GRPC -- which means that both code and humans will have to look at both settings in order to understand the behavior.

Specifically:

  • In terms of the data plane implementation, the code implementing the body send mode in the data plane will need to understand the content type and alter its behavior accordingly, so I don't think this change actually makes anything simpler there: the content type setting will not reduce implementation complexity in Envoy.
  • The presence of the content type setting will make ext_proc server implementations more complex, because any ext_proc server will need to look at two different settings in order to decide how to interpret the body chunks that it's receiving and know what body chunks it needs to send back.
  • There are certain combinations of body send mode and content type that are inherently nonsensical and would not be supported (e.g., STREAMED and GRPC). If they are two separate knobs, then every data plane and every ext_proc server will need to decide how to handle these unsupported combinations.
  • For humans, it will be harder to understand the behavior if the behavior is dictated by two different settings that interact with each other so deeply rather than just one. We will need to document the behavior for every possible combination of body send mode and content type: each body send mode will need to document which content types it supports and how that content type affects the state machine, and each content type will need to document which body send modes it supports. For example, we'll need to document things like "GRPC content_type is supported only in FULL_DUPLEX_STREAMED body send mode" and "in FULL_DUPLEX_STREAMED body send mode, if the content type is GRPC, each body chunk sent to or from the ext_proc server is a single deframed gRPC message". In contrast, if we have just one setting for body send mode, then it's much easier for users to understand the behavior of that mode.

Given that these two things are really just a single dimension, I think it would make things much easier for the configuration to reflect that. I would suggest instead defining new body send modes for each actual body send behavior, including those that are content-aware. In other words:

  • We can rename GRPC body send mode to FULL_DUPLEX_STREAMED_GRPC.
  • In the future, we can add BUFFERED_JSON_RPC and FULL_DUPLEX_STREAMED_JSON_RPC if needed.

I realize that this approach will wind up with a larger number of body send modes, but I think it will ultimately make it easier to understand and implement.

To be clear, I think we are going to ultimately support the same set of modes either way; the question here is only about which configuration structure winds up being easier to understand and which adds more complexity. If there's a strong argument for doing this as a separate content type knob, we can make that work, but it seems worse to me in terms of complexity and understandability.

Thoughts...?


As an aside, it's still not clear to me that it makes sense to support BUFFERED mode for gRPC traffic, for the following reasons:

  • This mode is useful only for unary RPCs, where there is only a single gRPC message on the stream. However, there is no indication in the wire protocol whether the RPC is unary or streaming, so the data plane would not even know that the RPC is streaming until after it sends the initial gRPC message to the ext_proc server. And it's not clear how the data plane should react at that point.
  • This mode does not send the body to the ext_proc server until after it receives the ext_proc response for the request headers, which means that it adds significant latency. This is something gRPC works hard to avoid, especially for unary RPCs: we send the client headers, message, and a half close in a single write on the TCP connection for performance reasons.

That having been said, we don't need to decide this right now, as long as we leave room for the possibility in the future. I think that if we rename the GRPC mode to FULL_DUPLEX_STREAMED_GRPC, it will leave an easy way to add support for a BUFFERED_GRPC mode in the future if we decide to do that.

Contributor

It's not clear to me that introducing a separate content type setting actually provides a better story for doing that, because it's not actually an independent dimension from the body send mode.

Why can't it be independent? The bytes that the ext_proc filter sends to the server are opaque to it; there is no specific meaning attached to them today. Today they are implied to be a portion (not even corresponding to H/2 DATA or H/1 chunks) of the HTTP body, because no other protocols are used with ext_proc. This can be made explicit with an additional content-type field.

We'd like to make ext_proc and other filters work generically with the protocols encapsulated within HTTP. I think we can make this work by adding ambient frame information to the request that ext_proc can use to generically support sending and receiving of encapsulated protocols. We have at least 2 in the pipeline: GRPC, JSON-RPC/MCP. WebSocket is also being asked for, but this is less definitive, so we want to give developers a flexible way to add support for encapsulated protocols without having to also modify ext_proc protocol.

}

// How to handle the request header. Default is "SEND".