diff --git a/.release-please-manifest.json b/.release-please-manifest.json
index 09a252282..6a787c5c9 100644
--- a/.release-please-manifest.json
+++ b/.release-please-manifest.json
@@ -1,3 +1,3 @@
 {
-    ".": "1.2.0"
+    ".": "1.3.0"
 }
diff --git a/CHANGELOG.md b/CHANGELOG.md
index c9ae0d827..2d258953d 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,22 @@
 # Changelog
 
+## [1.3.0](https://github.com/google/adk-java/compare/v1.2.0...v1.3.0) (2026-05-13)
+
+
+### Features
+
+* Add ChatCompletionsHTTPClient and support for non-streaming requests ([9529c1a](https://github.com/google/adk-java/commit/9529c1aeecb324e1c00c6bd105df2a0e9f67ed26))
+* Add conversion from LlmRequest to ChatCompletionsRequest ([d37f6ee](https://github.com/google/adk-java/commit/d37f6ee6d8ec036154593b734f1a3b080847cfea))
+* Add SkillSource interface and implementations for loading skills ([509c4aa](https://github.com/google/adk-java/commit/509c4aa75fdc752c2758a1761cbd8946075b310c))
+* Add support for refusal content using "[[REFUSAL]]:" prefix ([e9184c9](https://github.com/google/adk-java/commit/e9184c9846d97f65907667aa2a6bbac1f65fed64))
+* Refactor BigQueryAgentAnalyticsPlugin for async in preparation for GCS offloading ([d837ef0](https://github.com/google/adk-java/commit/d837ef0164cedd284af6caee84911569109ab7e3))
+
+
+### Bug Fixes
+
+* Account for nulls in EventActions and State ([582cf7c](https://github.com/google/adk-java/commit/582cf7c2b6534afaf5edfa501391191478d8d8ea))
+* upgrade Mockito and JaCoCo for Java 25 compatibility ([8574fc5](https://github.com/google/adk-java/commit/8574fc5bb6ac7edae99306b06c0a610f7da60048))
+
 ## [1.2.0](https://github.com/google/adk-java/compare/v1.1.0...v1.2.0) (2026-04-24)
 
 
diff --git a/README.md b/README.md
index 107a6967b..9613078dd 100644
--- a/README.md
+++ b/README.md
@@ -50,13 +50,13 @@ If you're using Maven, add the following to your dependencies:
 <dependency>
   <groupId>com.google.adk</groupId>
   <artifactId>google-adk</artifactId>
-  <version>1.2.0</version>
+  <version>1.3.0</version>
 </dependency>
 <!-- Dev UI -->
 <dependency>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-dev</artifactId>
-    <version>1.2.0</version>
+    <version>1.3.0</version>
 </dependency>
 ```
 
diff --git a/a2a/pom.xml b/a2a/pom.xml
index 3e0b049d6..85eb3e0fa 100644
--- a/a2a/pom.xml
+++ b/a2a/pom.xml
@@ -5,7 +5,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-parent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
   </parent>
 
   <artifactId>google-adk-a2a</artifactId>
diff --git a/contrib/firestore-session-service/pom.xml b/contrib/firestore-session-service/pom.xml
index 121877444..58f984a31 100644
--- a/contrib/firestore-session-service/pom.xml
+++ b/contrib/firestore-session-service/pom.xml
@@ -20,7 +20,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-parent</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>../../pom.xml</relativePath>
     </parent>
 
diff --git a/contrib/langchain4j/pom.xml b/contrib/langchain4j/pom.xml
index b7e4cb56f..94fb8fa24 100644
--- a/contrib/langchain4j/pom.xml
+++ b/contrib/langchain4j/pom.xml
@@ -20,7 +20,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-parent</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>../../pom.xml</relativePath>
     </parent>
 
diff --git a/contrib/planners/pom.xml b/contrib/planners/pom.xml
index 1f9afa17a..eafe4cdfb 100644
--- a/contrib/planners/pom.xml
+++ b/contrib/planners/pom.xml
@@ -20,7 +20,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-parent</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>../../pom.xml</relativePath>
     </parent>
 
diff --git a/contrib/samples/a2a_basic/pom.xml b/contrib/samples/a2a_basic/pom.xml
index 1e7af90ae..737daf7eb 100644
--- a/contrib/samples/a2a_basic/pom.xml
+++ b/contrib/samples/a2a_basic/pom.xml
@@ -5,7 +5,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-samples</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <relativePath>..</relativePath>
   </parent>
 
diff --git a/contrib/samples/a2a_server/pom.xml b/contrib/samples/a2a_server/pom.xml
index b1414eff4..410c45b16 100644
--- a/contrib/samples/a2a_server/pom.xml
+++ b/contrib/samples/a2a_server/pom.xml
@@ -5,7 +5,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-samples</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <relativePath>..</relativePath>
   </parent>
 
diff --git a/contrib/samples/configagent/pom.xml b/contrib/samples/configagent/pom.xml
index 097323363..08207ad57 100644
--- a/contrib/samples/configagent/pom.xml
+++ b/contrib/samples/configagent/pom.xml
@@ -5,7 +5,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-samples</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>..</relativePath>
     </parent>
 
diff --git a/contrib/samples/helloworld/pom.xml b/contrib/samples/helloworld/pom.xml
index 4e6ad4892..be7dc6551 100644
--- a/contrib/samples/helloworld/pom.xml
+++ b/contrib/samples/helloworld/pom.xml
@@ -20,7 +20,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-samples</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>..</relativePath>
     </parent>
 
diff --git a/contrib/samples/mcpfilesystem/pom.xml b/contrib/samples/mcpfilesystem/pom.xml
index f4ad43c84..d3ee68cdc 100644
--- a/contrib/samples/mcpfilesystem/pom.xml
+++ b/contrib/samples/mcpfilesystem/pom.xml
@@ -20,7 +20,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-parent</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>../../..</relativePath>
     </parent>
 
diff --git a/contrib/samples/pom.xml b/contrib/samples/pom.xml
index d9ce06aa7..d5e9470e7 100644
--- a/contrib/samples/pom.xml
+++ b/contrib/samples/pom.xml
@@ -5,7 +5,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-parent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <relativePath>../..</relativePath>
   </parent>
 
diff --git a/contrib/spring-ai/pom.xml b/contrib/spring-ai/pom.xml
index 7e8c61a8a..00abe7f27 100644
--- a/contrib/spring-ai/pom.xml
+++ b/contrib/spring-ai/pom.xml
@@ -20,7 +20,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-parent</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>../../pom.xml</relativePath>
     </parent>
 
diff --git a/core/pom.xml b/core/pom.xml
index 53fd51883..f0bafe01b 100644
--- a/core/pom.xml
+++ b/core/pom.xml
@@ -20,7 +20,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-parent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
   </parent>
 
   <artifactId>google-adk</artifactId>
diff --git a/core/src/main/java/com/google/adk/Version.java b/core/src/main/java/com/google/adk/Version.java
index 2816d6763..d440f4d9e 100644
--- a/core/src/main/java/com/google/adk/Version.java
+++ b/core/src/main/java/com/google/adk/Version.java
@@ -22,7 +22,7 @@
  */
 public final class Version {
   // Don't touch this, release-please should keep it up to date.
-  public static final String JAVA_ADK_VERSION = "1.2.0"; // x-release-please-released-version
+  public static final String JAVA_ADK_VERSION = "1.3.0"; // x-release-please-released-version
 
   private Version() {}
 }
diff --git a/core/src/main/java/com/google/adk/models/Gemini.java b/core/src/main/java/com/google/adk/models/Gemini.java
index 6f145e1de..40809b85e 100644
--- a/core/src/main/java/com/google/adk/models/Gemini.java
+++ b/core/src/main/java/com/google/adk/models/Gemini.java
@@ -226,21 +226,7 @@ public Flowable<LlmResponse> generateContent(LlmRequest llmRequest, boolean stre
               () ->
                   processRawResponses(
                       Flowable.fromFuture(streamFuture).flatMapIterable(iterable -> iterable)))
-          .filter(
-              llmResponse ->
-                  llmResponse
-                      .content()
-                      .flatMap(Content::parts)
-                      .map(
-                          parts ->
-                              !parts.isEmpty()
-                                  && parts.stream()
-                                      .anyMatch(
-                                          p ->
-                                              p.functionCall().isPresent()
-                                                  || p.functionResponse().isPresent()
-                                                  || p.text().isPresent()))
-                      .orElse(false));
+          .filter(Gemini::shouldEmit);
     } else {
       logger.debug("Sending generateContent request to model {}", effectiveModelName);
       return Flowable.fromFuture(
@@ -298,7 +284,28 @@ static Flowable<LlmResponse> processRawResponses(Flowable<GenerateContentRespons
                   responsesToEmit.add(aggregatedTextResponse);
                   accumulatedText.setLength(0);
                 }
-                responsesToEmit.add(currentProcessedLlmResponse);
+                if (isEmptyTextOnlyResponse(currentProcessedLlmResponse)) {
+                  // Strip the empty-text content while preserving any carried metadata
+                  // (`usageMetadata`, `finishReason`, `modelVersion`, etc.) by emitting a
+                  // content-less response marked as `partial`. This handles the trailing
+                  // `{parts:[{text:""}], finishReason:STOP}` chunk emitted by some Gemini
+                  // preview models (e.g. 3.1-flash-lite) after a function call: keeping
+                  // the chunk as-is would propagate it as a non-partial event whose
+                  // Event#finalResponse() returns true and prematurely terminate
+                  // BaseLlmFlow#run before the function response is sent back to the
+                  // model; dropping it entirely would lose the carried metadata. If the
+                  // chunk carries no useful metadata at all, suppress it outright.
+                  LlmResponse metadataOnly =
+                      currentProcessedLlmResponse.toBuilder()
+                          .content((Content) null)
+                          .partial(true)
+                          .build();
+                  if (hasUsefulMetadata(metadataOnly)) {
+                    responsesToEmit.add(metadataOnly);
+                  }
+                } else {
+                  responsesToEmit.add(currentProcessedLlmResponse);
+                }
               }
               logger.debug("Responses to emit: {}", responsesToEmit);
               return Flowable.fromIterable(responsesToEmit);
@@ -358,6 +365,67 @@ private static LlmResponse thinkingResponseFromText(String accumulatedThoughtTex
         .build();
   }
 
+  /**
+   * Returns true if {@code response} should be emitted downstream by the streaming pipeline.
+   *
+   * <p>Drops chunks that carry neither semantic content (i.e. they are an empty-text-only response
+   * per {@link #isEmptyTextOnlyResponse}) nor any useful metadata (per {@link #hasUsefulMetadata}).
+   *
+   * <p>Package-private for testing.
+   */
+  static boolean shouldEmit(LlmResponse response) {
+    return !isEmptyTextOnlyResponse(response) || hasUsefulMetadata(response);
+  }
+
+  /**
+   * Returns true if {@code response} carries any non-content metadata that should be propagated
+   * downstream (e.g. {@code usageMetadata}, {@code finishReason}, transcriptions, grounding or
+   * error info). Inspects only top-level {@link LlmResponse} fields; the response's content/parts
+   * are intentionally not considered here.
+   */
+  private static boolean hasUsefulMetadata(LlmResponse response) {
+    return response.usageMetadata().isPresent()
+        || response.finishReason().isPresent()
+        || response.errorCode().isPresent()
+        || response.groundingMetadata().isPresent()
+        || response.inputTranscription().isPresent()
+        || response.outputTranscription().isPresent();
+  }
+
+  /**
+   * Returns true if {@code response} consists of exactly one {@link Part} whose only meaningful
+   * payload is an empty text string (i.e. {@code parts:[{text:""}]}). Such a chunk can be safely
+   * dropped from the streaming aggregator because it carries no semantic content for the agent
+   * pipeline. A part is considered to carry semantic content if any of its non-text payloads
+   * ({@code functionCall}, {@code functionResponse}, {@code inlineData}, {@code executableCode},
+   * {@code codeExecutionResult}, {@code fileData}, {@code thoughtSignature}, {@code videoMetadata},
+   * {@code toolCall}, {@code toolResponse}) is present.
+   */
+  private static boolean isEmptyTextOnlyResponse(LlmResponse response) {
+    return response
+        .content()
+        .flatMap(Content::parts)
+        .map(
+            parts -> {
+              if (parts.size() != 1) {
+                return false;
+              }
+              Part part = parts.get(0);
+              return part.text().map(String::isEmpty).orElse(false)
+                  && part.functionCall().isEmpty()
+                  && part.functionResponse().isEmpty()
+                  && part.inlineData().isEmpty()
+                  && part.executableCode().isEmpty()
+                  && part.codeExecutionResult().isEmpty()
+                  && part.fileData().isEmpty()
+                  && part.thoughtSignature().isEmpty()
+                  && part.videoMetadata().isEmpty()
+                  && part.toolCall().isEmpty()
+                  && part.toolResponse().isEmpty();
+            })
+        .orElse(false);
+  }
+
   @Override
   public BaseLlmConnection connect(LlmRequest llmRequest) {
     if (!apiClient.vertexAI()) {
diff --git a/core/src/main/java/com/google/adk/models/chat/ChatCompletionsHttpClient.java b/core/src/main/java/com/google/adk/models/chat/ChatCompletionsHttpClient.java
new file mode 100644
index 000000000..5b2b03a33
--- /dev/null
+++ b/core/src/main/java/com/google/adk/models/chat/ChatCompletionsHttpClient.java
@@ -0,0 +1,256 @@
+/*
+ * Copyright 2026 Google LLC
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *      https://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.google.adk.models.chat;
+
+import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.adk.JsonBaseModel;
+import com.google.adk.models.LlmRequest;
+import com.google.adk.models.LlmResponse;
+import com.google.common.collect.ImmutableMap;
+import com.google.genai.types.HttpOptions;
+import io.reactivex.rxjava3.core.BackpressureStrategy;
+import io.reactivex.rxjava3.core.Flowable;
+import io.reactivex.rxjava3.core.FlowableEmitter;
+import java.io.IOException;
+import java.time.Duration;
+import java.util.Map;
+import java.util.Objects;
+import okhttp3.Call;
+import okhttp3.Callback;
+import okhttp3.HttpUrl;
+import okhttp3.MediaType;
+import okhttp3.OkHttpClient;
+import okhttp3.Request;
+import okhttp3.RequestBody;
+import okhttp3.Response;
+import okhttp3.ResponseBody;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+
+/**
+ * An HTTP client for interacting with OpenAI-compatible chat completions endpoints.
+ *
+ * <p>Supports both non-streaming responses (single {@link LlmResponse} emission) and streaming
+ * Server-Sent Events (SSE) responses (multiple incremental {@link LlmResponse} emissions). See the
+ * <a href="https://developers.openai.com/api/reference/resources/chat">OpenAI Chat Completions API
+ * reference</a> for the wire protocol.
+ */
+public class ChatCompletionsHttpClient {
+  private static final Logger logger = LoggerFactory.getLogger(ChatCompletionsHttpClient.class);
+  private static final ObjectMapper objectMapper = JsonBaseModel.getMapper();
+
+  private static final MediaType JSON = MediaType.get("application/json; charset=utf-8");
+
+  /**
+   * Default OkHttp call timeout used when the caller does not supply an {@link HttpOptions}
+   * timeout. Five minutes is long enough for most non-streaming completions and short enough to
+   * prevent indefinite hangs in the common case where the caller does not configure timeouts.
+   * Callers who need infinite (e.g. long batch jobs or open streams) can opt in by passing an
+   * {@link HttpOptions} with {@code timeout() == 0}.
+   */
+  private static final Duration DEFAULT_CALL_TIMEOUT = Duration.ofMinutes(5);
+
+  /**
+   * Shared OkHttpClient instance whose connection pool and thread dispatcher are reused across all
+   * {@link ChatCompletionsHttpClient} instances. Each instance forks this client via {@link
+   * OkHttpClient#newBuilder()} to apply per-instance timeouts without leaking pools.
+   */
+  private static final OkHttpClient SHARED_POOL_CLIENT = new OkHttpClient();
+
+  private final OkHttpClient client;
+  private final HttpUrl completionsUrl;
+  private final ImmutableMap<String, String> headers;
+
+  /**
+   * Constructs a new {@link ChatCompletionsHttpClient} that facilitates API interaction with the
+   * standard {@code /chat/completions} REST endpoint.
+   *
+   * <p>All configuration is sourced from the supplied {@link HttpOptions}:
+   *
+   * <ul>
+   *   <li>{@link HttpOptions#baseUrl()} -- <b>required</b>. The base URL of the chat completions
+   *       endpoint. The {@code chat/completions} path segments are appended automatically using
+   *       {@link HttpUrl}, which handles trailing slashes and percent-encoding deterministically.
+   *       Set via {@code HttpOptions.builder().baseUrl("https://...").build()}.
+   *   <li>{@link HttpOptions#headers()} -- optional. Extra HTTP headers to include in outgoing
+   *       requests. The {@code Content-Type} header is set automatically and cannot be overridden.
+   *       Set via {@code HttpOptions.builder().headers(Map.of("Authorization", "Bearer ...")) }.
+   *   <li>{@link HttpOptions#timeout()} -- optional. Per-call timeout in milliseconds. A missing
+   *       timeout defaults to 5 minutes ({@link #DEFAULT_CALL_TIMEOUT}). A timeout of {@code 0} is
+   *       respected as the explicit caller opt-in to infinite wait. Set via {@code
+   *       HttpOptions.builder().timeout(10_000).build()}.
+   * </ul>
+   *
+   * <p>Example:
+   *
+   * <pre>{@code
+   * HttpOptions options =
+   *     HttpOptions.builder()
+   *         .baseUrl("https://example.com/v1/")
+   *         .headers(ImmutableMap.of("Authorization", "Bearer my-token"))
+   *         .timeout(30_000)
+   *         .build();
+   * ChatCompletionsHttpClient client = new ChatCompletionsHttpClient(options);
+   * }</pre>
+   *
+   * @param httpOptions HTTP configuration. Must not be {@code null}, and {@link
+   *     HttpOptions#baseUrl()} must be present and parseable as an HTTP(S) URL.
+   * @throws IllegalArgumentException if {@code httpOptions.baseUrl()} is missing or is not a valid
+   *     HTTP(S) URL.
+   */
+  public ChatCompletionsHttpClient(HttpOptions httpOptions) {
+    Objects.requireNonNull(httpOptions, "httpOptions cannot be null");
+    String baseUrl =
+        httpOptions
+            .baseUrl()
+            .orElseThrow(() -> new IllegalArgumentException("httpOptions.baseUrl() must be set"));
+    HttpUrl parsedBaseUrl = HttpUrl.parse(baseUrl);
+    if (parsedBaseUrl == null) {
+      throw new IllegalArgumentException(
+          "httpOptions.baseUrl() is not a valid HTTP(S) URL: " + baseUrl);
+    }
+    // Pre-build the completions URL once. HttpUrl.addPathSegment handles trailing slashes,
+    // percent-encoding, and existing path components on baseUrl deterministically.
+    this.completionsUrl =
+        parsedBaseUrl.newBuilder().addPathSegment("chat").addPathSegment("completions").build();
+    // Defensive copy of caller-supplied headers; absent is treated as no extra headers.
+    this.headers =
+        httpOptions
+            .headers()
+            .<ImmutableMap<String, String>>map(ImmutableMap::copyOf)
+            .orElse(ImmutableMap.of());
+
+    // Apply custom timeouts per instance. All internal timeouts are bounded by callTimeout.
+    OkHttpClient.Builder builder = SHARED_POOL_CLIENT.newBuilder();
+    builder.connectTimeout(Duration.ZERO);
+    builder.readTimeout(Duration.ZERO);
+    builder.writeTimeout(Duration.ZERO);
+    builder.callTimeout(resolveCallTimeout(httpOptions));
+    this.client = builder.build();
+  }
+
+  /** Resolves the call timeout from HttpOptions. */
+  private static Duration resolveCallTimeout(HttpOptions httpOptions) {
+    if (httpOptions.timeout().isEmpty()) {
+      return DEFAULT_CALL_TIMEOUT;
+    }
+    long timeoutMs = httpOptions.timeout().get();
+    // 0 is treated as no timeout (Duration.ZERO).
+    return timeoutMs == 0L ? Duration.ZERO : Duration.ofMillis(timeoutMs);
+  }
+
+  /**
+   * Generates a conversational response from the chat completions endpoint based on the provided
+   * messages. This encapsulates building the HTTP payload, sending the request to the completions
+   * endpoint, and initiating the handling of complete calls.
+   *
+   * @param llmRequest The request containing the model, configuration, and sequence of messages.
+   * @param stream Whether to request a streaming response.
+   * @return A {@link Flowable} emitting the discrete (or combined) {@link LlmResponse} objects.
+   */
+  public Flowable<LlmResponse> complete(LlmRequest llmRequest, boolean stream) {
+    return Flowable.defer(
+        () -> {
+          ChatCompletionsRequest dtoRequest =
+              ChatCompletionsRequest.fromLlmRequest(llmRequest, stream);
+          String jsonPayload = objectMapper.writeValueAsString(dtoRequest);
+          logger.trace(
+              "Chat Completion Request: model={}, stream={}, messagesCount={}",
+              dtoRequest.model,
+              dtoRequest.stream,
+              dtoRequest.messages != null ? dtoRequest.messages.size() : 0);
+
+          Request.Builder requestBuilder =
+              new Request.Builder().url(completionsUrl).post(RequestBody.create(jsonPayload, JSON));
+
+          for (Map.Entry<String, String> entry : headers.entrySet()) {
+            requestBuilder.addHeader(entry.getKey(), entry.getValue());
+          }
+          // Defensively force Content-Type to JSON by replacing instead of appending.
+          requestBuilder.header("Content-Type", JSON.toString());
+
+          Request request = requestBuilder.build();
+          if (stream) {
+            return createStreamingFlowable(request);
+          } else {
+            return createNonStreamingFlowable(request);
+          }
+        });
+  }
+
+  /** Placeholder for streaming responses. Errors with {@link UnsupportedOperationException}. */
+  @SuppressWarnings("UnusedVariable")
+  private Flowable<LlmResponse> createStreamingFlowable(Request request) {
+    return Flowable.error(
+        new UnsupportedOperationException("Streaming is not yet implemented in this client."));
+  }
+
+  /**
+   * Wraps an OkHttp {@link Callback} in a reactive {@link Flowable} for single-turn, non-streaming
+   * responses.
+   */
+  private Flowable<LlmResponse> createNonStreamingFlowable(Request request) {
+    return Flowable.create(
+        emitter -> {
+          Call call = client.newCall(request);
+          emitter.setCancellable(call::cancel);
+          call.enqueue(new NonStreamingCallback(emitter));
+        },
+        BackpressureStrategy.BUFFER);
+  }
+
+  /**
+   * Handles OkHttp failure and success callbacks, pushing {@link LlmResponse} results to the given
+   * emitter.
+   */
+  private static final class NonStreamingCallback implements Callback {
+    private final FlowableEmitter<LlmResponse> emitter;
+
+    NonStreamingCallback(FlowableEmitter<LlmResponse> emitter) {
+      this.emitter = emitter;
+    }
+
+    @Override
+    public void onFailure(Call call, IOException e) {
+      emitter.tryOnError(e);
+    }
+
+    @Override
+    public void onResponse(Call call, Response response) {
+      try (ResponseBody body = response.body()) {
+        if (!response.isSuccessful()) {
+          String bodyStr = body != null ? body.string() : "";
+          emitter.tryOnError(
+              new IOException("Unexpected code " + response + " - body: " + bodyStr));
+          return;
+        }
+        if (body == null) {
+          emitter.tryOnError(new IOException("Empty response body"));
+          return;
+        }
+
+        String jsonResponse = body.string();
+        ChatCompletionsResponse.ChatCompletion completion =
+            objectMapper.readValue(jsonResponse, ChatCompletionsResponse.ChatCompletion.class);
+        emitter.onNext(completion.toLlmResponse());
+        emitter.onComplete();
+      } catch (Exception e) {
+        emitter.tryOnError(e);
+      }
+    }
+  }
+}
diff --git a/core/src/test/java/com/google/adk/models/GeminiTest.java b/core/src/test/java/com/google/adk/models/GeminiTest.java
index c230f5f68..656b5e596 100644
--- a/core/src/test/java/com/google/adk/models/GeminiTest.java
+++ b/core/src/test/java/com/google/adk/models/GeminiTest.java
@@ -63,6 +63,81 @@ public void processRawResponses_withTextChunks_emitsPartialResponses() {
         isFunctionCallResponse());
   }
 
+  // Regression test for b/513501918. gemini-3.1-flash-lite emits an extra trailing chunk after a
+  // function call: `{parts:[{text:""}], finishReason:STOP}`. That chunk must not be propagated as
+  // a non-partial event because BaseLlmFlow#run would treat it as the final response and
+  // terminate the loop before the function response is sent back to the model. The chunk's
+  // metadata (e.g. `finishReason`, `usageMetadata`) is preserved by emitting it on a content-less
+  // partial response instead of dropping the chunk entirely.
+  @Test
+  public void
+      processRawResponses_functionCallThenEmptyTextWithStop_emitsFunctionCallAndMetadataOnlyPartial() {
+    Flowable<GenerateContentResponse> rawResponses =
+        Flowable.just(
+            toResponse(Part.fromFunctionCall("test_function", ImmutableMap.of())),
+            toResponseWithText("", FinishReason.Known.STOP));
+
+    Flowable<LlmResponse> llmResponses = Gemini.processRawResponses(rawResponses);
+
+    assertLlmResponses(
+        llmResponses,
+        isFunctionCallResponse(),
+        isContentlessPartialWithFinishReason(FinishReason.Known.STOP));
+  }
+
+  // Same as above but with `usageMetadata` on the trailing empty chunk: the metadata must survive
+  // on the emitted content-less partial.
+  @Test
+  public void
+      processRawResponses_functionCallThenEmptyTextWithUsageMetadata_preservesUsageMetadata() {
+    GenerateContentResponseUsageMetadata metadata = createUsageMetadata(5, 10, 15);
+    Flowable<GenerateContentResponse> rawResponses =
+        Flowable.just(
+            toResponse(Part.fromFunctionCall("test_function", ImmutableMap.of())),
+            toResponseWithText("", FinishReason.Known.STOP, metadata));
+
+    Flowable<LlmResponse> llmResponses = Gemini.processRawResponses(rawResponses);
+
+    assertLlmResponses(
+        llmResponses, isFunctionCallResponse(), isContentlessPartialWithUsageMetadata(metadata));
+  }
+
+  // Same as above but without a finishReason or usageMetadata: the trailing empty chunk carries no
+  // useful payload and must be suppressed entirely.
+  @Test
+  public void processRawResponses_functionCallThenEmptyText_doesNotEmitExtraEmptyResponse() {
+    Flowable<GenerateContentResponse> rawResponses =
+        Flowable.just(
+            toResponse(Part.fromFunctionCall("test_function", ImmutableMap.of())),
+            toResponseWithText(""));
+
+    Flowable<LlmResponse> llmResponses = Gemini.processRawResponses(rawResponses);
+
+    assertLlmResponses(llmResponses, isFunctionCallResponse());
+  }
+
+  // Combined scenario: leading partial text, then a function call, then the trailing empty-text
+  // chunk with STOP. Accumulated text must still be flushed, the function call must still be
+  // emitted, and the trailing chunk must surface only its metadata on a content-less partial.
+  @Test
+  public void
+      processRawResponses_textThenFunctionCallThenEmptyTextWithStop_emitsTextFunctionCallAndMetadata() {
+    Flowable<GenerateContentResponse> rawResponses =
+        Flowable.just(
+            toResponseWithText("Thinking..."),
+            toResponse(Part.fromFunctionCall("test_function", ImmutableMap.of())),
+            toResponseWithText("", FinishReason.Known.STOP));
+
+    Flowable<LlmResponse> llmResponses = Gemini.processRawResponses(rawResponses);
+
+    assertLlmResponses(
+        llmResponses,
+        isPartialTextResponse("Thinking..."),
+        isFinalTextResponse("Thinking..."),
+        isFunctionCallResponse(),
+        isContentlessPartialWithFinishReason(FinishReason.Known.STOP));
+  }
+
   @Test
   public void processRawResponses_textAndStopReason_emitsPartialThenFinalText() {
     Flowable<GenerateContentResponse> rawResponses =
@@ -175,6 +250,93 @@ public void processRawResponses_thoughtChunksAndStop_includeUsageMetadata() {
         isFinalThoughtResponseWithUsageMetadata("Thinking deeply", metadata2));
   }
 
+  // Test cases for the shouldEmit filter applied by generateContent after processRawResponses.
+  // shouldEmit drops chunks that are empty-text-only AND carry no useful metadata; everything else
+  // is forwarded. processRawResponses normally already strips empty-text-only chunks, so shouldEmit
+  // is defense-in-depth, but it must still behave correctly when fed any LlmResponse directly.
+
+  @Test
+  public void shouldEmit_emptyTextOnlyResponseWithNoMetadata_returnsFalse() {
+    LlmResponse response =
+        LlmResponse.builder()
+            .content(Content.builder().role("model").parts(Part.fromText("")).build())
+            .build();
+
+    assertThat(Gemini.shouldEmit(response)).isFalse();
+  }
+
+  @Test
+  public void shouldEmit_emptyTextOnlyResponseWithFinishReason_returnsTrue() {
+    LlmResponse response =
+        LlmResponse.builder()
+            .content(Content.builder().role("model").parts(Part.fromText("")).build())
+            .finishReason(new FinishReason(FinishReason.Known.STOP))
+            .build();
+
+    assertThat(Gemini.shouldEmit(response)).isTrue();
+  }
+
+  @Test
+  public void shouldEmit_emptyTextOnlyResponseWithUsageMetadata_returnsTrue() {
+    LlmResponse response =
+        LlmResponse.builder()
+            .content(Content.builder().role("model").parts(Part.fromText("")).build())
+            .usageMetadata(createUsageMetadata(5, 10, 15))
+            .build();
+
+    assertThat(Gemini.shouldEmit(response)).isTrue();
+  }
+
+  @Test
+  public void shouldEmit_nonEmptyTextResponse_returnsTrue() {
+    LlmResponse response =
+        LlmResponse.builder()
+            .content(Content.builder().role("model").parts(Part.fromText("hello")).build())
+            .build();
+
+    assertThat(Gemini.shouldEmit(response)).isTrue();
+  }
+
+  @Test
+  public void shouldEmit_functionCallResponse_returnsTrue() {
+    LlmResponse response =
+        LlmResponse.builder()
+            .content(
+                Content.builder()
+                    .role("model")
+                    .parts(Part.fromFunctionCall("test_function", ImmutableMap.of()))
+                    .build())
+            .build();
+
+    assertThat(Gemini.shouldEmit(response)).isTrue();
+  }
+
+  @Test
+  public void shouldEmit_contentlessResponse_returnsTrue() {
+    // A response with no content at all is not an empty-text-only response, so it should pass
+    // through regardless of metadata. This is the shape emitted by processRawResponses after it
+    // strips empty-text content while preserving metadata.
+    LlmResponse response = LlmResponse.builder().build();
+
+    assertThat(Gemini.shouldEmit(response)).isTrue();
+  }
+
+  @Test
+  public void shouldEmit_multiPartResponseWithEmptyTextPart_returnsTrue() {
+    // Only single-part empty-text responses are considered "empty-text-only". A multi-part response
+    // is treated as carrying semantic content and must always pass through.
+    LlmResponse response =
+        LlmResponse.builder()
+            .content(
+                Content.builder()
+                    .role("model")
+                    .parts(Part.fromText(""), Part.fromText("hello"))
+                    .build())
+            .build();
+
+    assertThat(Gemini.shouldEmit(response)).isTrue();
+  }
+
   @Test
   public void processRawResponses_thoughtAndTextWithStop_onlyFinalTextIncludesUsageMetadata() {
     GenerateContentResponseUsageMetadata metadata1 = createUsageMetadata(5, 5, 10);
@@ -232,6 +394,26 @@ private static Predicate<LlmResponse> isFunctionCallResponse() {
     };
   }
 
+  private static Predicate<LlmResponse> isContentlessPartialWithFinishReason(
+      FinishReason.Known expectedFinishReason) {
+    return response -> {
+      assertThat(response.partial()).hasValue(true);
+      assertThat(response.content()).isEmpty();
+      assertThat(response.finishReason().map(fr -> fr.knownEnum())).hasValue(expectedFinishReason);
+      return true;
+    };
+  }
+
+  private static Predicate<LlmResponse> isContentlessPartialWithUsageMetadata(
+      GenerateContentResponseUsageMetadata expectedMetadata) {
+    return response -> {
+      assertThat(response.partial()).hasValue(true);
+      assertThat(response.content()).isEmpty();
+      assertThat(response.usageMetadata()).hasValue(expectedMetadata);
+      return true;
+    };
+  }
+
   private static Predicate<LlmResponse> isEmptyResponse() {
     return response -> {
       assertThat(response.partial()).isEmpty();
diff --git a/core/src/test/java/com/google/adk/models/chat/ChatCompletionsHttpClientTest.java b/core/src/test/java/com/google/adk/models/chat/ChatCompletionsHttpClientTest.java
new file mode 100644
index 000000000..175ca777e
--- /dev/null
+++ b/core/src/test/java/com/google/adk/models/chat/ChatCompletionsHttpClientTest.java
@@ -0,0 +1,477 @@
+/*
+ * Copyright 2026 Google LLC
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *      https://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.google.adk.models.chat;
+
+import static com.google.common.truth.Truth.assertThat;
+import static java.util.concurrent.TimeUnit.MILLISECONDS;
+import static org.junit.Assert.assertThrows;
+import static org.mockito.ArgumentMatchers.any;
+import static org.mockito.Mockito.doNothing;
+import static org.mockito.Mockito.verify;
+import static org.mockito.Mockito.when;
+
+import com.fasterxml.jackson.databind.JsonNode;
+import com.fasterxml.jackson.databind.ObjectMapper;
+import com.google.adk.JsonBaseModel;
+import com.google.adk.models.LlmRequest;
+import com.google.adk.models.LlmResponse;
+import com.google.common.collect.ImmutableList;
+import com.google.common.collect.ImmutableMap;
+import com.google.genai.types.Content;
+import com.google.genai.types.FinishReason;
+import com.google.genai.types.HttpOptions;
+import com.google.genai.types.Part;
+import io.reactivex.rxjava3.subscribers.TestSubscriber;
+import java.io.IOException;
+import java.lang.reflect.Field;
+import java.time.Duration;
+import okhttp3.Call;
+import okhttp3.Callback;
+import okhttp3.MediaType;
+import okhttp3.OkHttpClient;
+import okhttp3.Protocol;
+import okhttp3.Request;
+import okhttp3.Response;
+import okhttp3.ResponseBody;
+import okio.Buffer;
+import org.junit.Before;
+import org.junit.Rule;
+import org.junit.Test;
+import org.junit.runner.RunWith;
+import org.junit.runners.JUnit4;
+import org.mockito.ArgumentCaptor;
+import org.mockito.Mock;
+import org.mockito.junit.MockitoJUnit;
+import org.mockito.junit.MockitoRule;
+
+@RunWith(JUnit4.class)
+public final class ChatCompletionsHttpClientTest {
+  private static final ObjectMapper objectMapper = JsonBaseModel.getMapper();
+  private static final MediaType JSON = MediaType.get("application/json");
+
+  /**
+   * Bounded wait for {@link TestSubscriber#await} so a buggy callback wiring cannot hang the test
+   * JVM. The mock callbacks fire synchronously in the same thread, so this value is intentionally
+   * short -- on a successful run the await returns in microseconds, and on a hung run we fail fast
+   * instead of stalling the test suite.
+   */
+  private static final Duration AWAIT_TIMEOUT = Duration.ofMillis(500);
+
+  @Rule public final MockitoRule mocks = MockitoJUnit.rule();
+
+  @Mock private OkHttpClient mockHttpClient;
+  @Mock private Call mockCall;
+
+  private ChatCompletionsHttpClient client;
+
+  @Before
+  public void setUp() throws Exception {
+    client =
+        new ChatCompletionsHttpClient(
+            HttpOptions.builder().baseUrl("https://example.com/").build());
+    swapInMockHttpClient(client);
+  }
+
+  /**
+   * Reflectively replaces the production {@link OkHttpClient} on a {@link
+   * ChatCompletionsHttpClient} with the test's mock so callbacks can be captured. Used by both
+   * setUp and tests that construct their own client (e.g. timeout tests, header tests).
+   */
+  private void swapInMockHttpClient(ChatCompletionsHttpClient target) throws Exception {
+    when(mockHttpClient.newCall(any())).thenReturn(mockCall);
+    Field clientField = ChatCompletionsHttpClient.class.getDeclaredField("client");
+    clientField.setAccessible(true);
+    clientField.set(target, mockHttpClient);
+  }
+
+  private Response createMockResponse(String body, MediaType mediaType) {
+    return createMockResponse(body, mediaType, 200, "OK");
+  }
+
+  private Response createMockResponse(String body, MediaType mediaType, int code, String message) {
+    Response.Builder builder =
+        new Response.Builder()
+            .request(new Request.Builder().url("https://example.com/chat/completions").build())
+            .protocol(Protocol.HTTP_1_1)
+            .code(code)
+            .message(message);
+    // OkHttp's Response.Builder rejects a null body via its Kotlin @NotNull contract; omit
+    // the body() call entirely to model an empty/null response body.
+    if (body != null) {
+      builder.body(ResponseBody.create(body, mediaType));
+    }
+    return builder.build();
+  }
+
+  /** Returns a minimal {@link LlmRequest} suitable for tests that don't care about the payload. */
+  private static LlmRequest minimalRequest() {
+    return LlmRequest.builder()
+        .model("gpt-4")
+        .contents(ImmutableList.of(Content.builder().parts(Part.fromText("hello")).build()))
+        .build();
+  }
+
+  @Test
+  public void complete_nonStreaming_sendsCorrectPayload() throws Exception {
+    String responseBody =
+        """
+        {
+          "choices": [
+            {
+              "message": {
+                "role": "assistant",
+                "content": "Hi"
+              },
+              "finish_reason": "stop"
+            }
+          ]
+        }
+        """;
+
+    Response mockResponse = createMockResponse(responseBody, JSON);
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber = client.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    LlmResponse response = testSubscriber.values().get(0);
+
+    ArgumentCaptor<Request> requestCaptor = ArgumentCaptor.forClass(Request.class);
+    verify(mockHttpClient).newCall(requestCaptor.capture());
+    Request capturedRequest = requestCaptor.getValue();
+    assertThat(capturedRequest.url().encodedPath()).isEqualTo("/chat/completions");
+
+    Buffer buffer = new Buffer();
+    capturedRequest.body().writeTo(buffer);
+    JsonNode requestBodyJson = objectMapper.readTree(buffer.readUtf8());
+    assertThat(requestBodyJson.get("model").asText()).isEqualTo("gpt-4");
+    assertThat(requestBodyJson.get("messages").get(0).get("role").asText()).isEqualTo("user");
+    assertThat(requestBodyJson.get("messages").get(0).get("content").asText()).isEqualTo("hello");
+
+    LlmResponse expectedResponse =
+        LlmResponse.builder()
+            .content(
+                Content.builder()
+                    .role("model")
+                    .parts(ImmutableList.of(Part.fromText("Hi")))
+                    .build())
+            .finishReason(new FinishReason(FinishReason.Known.STOP.toString()))
+            .customMetadata(ImmutableList.of())
+            .build();
+
+    assertThat(response).isEqualTo(expectedResponse);
+  }
+
+  @Test
+  public void complete_nonStreaming_propagateFailure() throws Exception {
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber = client.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onFailure(mockCall, new IOException("Network Error"));
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    testSubscriber.assertError(IOException.class);
+  }
+
+  // -- Header, error-propagation, and timeout coverage. ----------------------------------
+
+  /**
+   * Verifies that an HTTP error status (e.g. 500) propagates as a stream error and that the error
+   * message includes the response body so callers can debug. Covers the {@code
+   * !response.isSuccessful()} branch of the non-streaming path. The streaming counterpart lives in
+   * the streaming follow-up CL.
+   */
+  @Test
+  public void complete_nonStreaming_propagatesHttpErrorStatus() throws Exception {
+    Response mockResponse =
+        createMockResponse("{\"error\":\"server exploded\"}", JSON, 500, "Internal Server Error");
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber = client.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    testSubscriber.assertError(
+        e ->
+            e instanceof IOException
+                && e.getMessage().contains("Unexpected code")
+                && e.getMessage().contains("server exploded"));
+  }
+
+  /**
+   * Verifies that an empty response body propagates as a stream error rather than silently emitting
+   * an empty value. The exact exception class depends on OkHttp's behavior:
+   *
+   * <ul>
+   *   <li>If OkHttp produces a {@code null} body, our code surfaces an {@link IOException} with the
+   *       message {@code "Empty response body"}.
+   *   <li>If OkHttp produces an empty (non-null) body, Jackson surfaces a {@link
+   *       com.fasterxml.jackson.databind.exc.MismatchedInputException} ("No content to map").
+   * </ul>
+   *
+   * Both outcomes satisfy the contract: empty body must NOT silently produce a successful empty
+   * {@link LlmResponse}.
+   */
+  @Test
+  public void complete_nonStreaming_propagatesEmptyBody() throws Exception {
+    Response mockResponse = createMockResponse(null, JSON);
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber = client.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    testSubscriber.assertNoValues();
+    testSubscriber.assertError(Throwable.class);
+  }
+
+  /**
+   * Verifies that caller-supplied headers reach the wire on the captured {@link Request}. This is
+   * the most common production failure mode (missing or wrong Authorization header), so it gets its
+   * own test rather than being implicit in other tests.
+   */
+  @Test
+  public void complete_sendsCustomHeaders() throws Exception {
+    ChatCompletionsHttpClient clientWithHeaders =
+        new ChatCompletionsHttpClient(
+            HttpOptions.builder()
+                .baseUrl("https://example.com/")
+                .headers(ImmutableMap.of("Authorization", "Bearer test-token", "X-Custom", "value"))
+                .build());
+    swapInMockHttpClient(clientWithHeaders);
+
+    String responseBody =
+        """
+        {"choices":[{"message":{"role":"assistant","content":"Hi"},"finish_reason":"stop"}]}
+        """;
+    Response mockResponse = createMockResponse(responseBody, JSON);
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber =
+        clientWithHeaders.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    ArgumentCaptor<Request> requestCaptor = ArgumentCaptor.forClass(Request.class);
+    verify(mockHttpClient).newCall(requestCaptor.capture());
+    Request capturedRequest = requestCaptor.getValue();
+    assertThat(capturedRequest.header("Authorization")).isEqualTo("Bearer test-token");
+    assertThat(capturedRequest.header("X-Custom")).isEqualTo("value");
+    // Content-Type is forced to application/json regardless of caller input.
+    assertThat(capturedRequest.header("Content-Type")).contains("application/json");
+  }
+
+  /**
+   * Verifies that even when a caller passes a conflicting {@code Content-Type} header, the client
+   * overrides it with {@code application/json} so the upstream API does not reject the request as a
+   * malformed payload.
+   */
+  @Test
+  public void complete_overridesCallerContentType() throws Exception {
+    ChatCompletionsHttpClient clientWithBadHeader =
+        new ChatCompletionsHttpClient(
+            HttpOptions.builder()
+                .baseUrl("https://example.com/")
+                .headers(ImmutableMap.of("Content-Type", "text/plain"))
+                .build());
+    swapInMockHttpClient(clientWithBadHeader);
+
+    String responseBody =
+        """
+        {"choices":[{"message":{"role":"assistant","content":"Hi"},"finish_reason":"stop"}]}
+        """;
+    Response mockResponse = createMockResponse(responseBody, JSON);
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber =
+        clientWithBadHeader.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    ArgumentCaptor<Request> requestCaptor = ArgumentCaptor.forClass(Request.class);
+    verify(mockHttpClient).newCall(requestCaptor.capture());
+    Request capturedRequest = requestCaptor.getValue();
+    // Should be exactly one Content-Type header, not two.
+    assertThat(capturedRequest.headers("Content-Type")).hasSize(1);
+    assertThat(capturedRequest.header("Content-Type")).contains("application/json");
+  }
+
+  /**
+   * Verifies that a {@code baseUrl} without a trailing slash still produces the correct {@code
+   * /chat/completions} path. {@link okhttp3.HttpUrl#newBuilder()} normalizes path segments
+   * regardless of the trailing-slash state of the base URL.
+   */
+  @Test
+  public void complete_handlesBaseUrlWithoutTrailingSlash() throws Exception {
+    ChatCompletionsHttpClient clientNoSlash =
+        new ChatCompletionsHttpClient(HttpOptions.builder().baseUrl("https://example.com").build());
+    swapInMockHttpClient(clientNoSlash);
+
+    String responseBody =
+        """
+        {"choices":[{"message":{"role":"assistant","content":"Hi"},"finish_reason":"stop"}]}
+        """;
+    Response mockResponse = createMockResponse(responseBody, JSON);
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber =
+        clientNoSlash.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    ArgumentCaptor<Request> requestCaptor = ArgumentCaptor.forClass(Request.class);
+    verify(mockHttpClient).newCall(requestCaptor.capture());
+    assertThat(requestCaptor.getValue().url().encodedPath()).isEqualTo("/chat/completions");
+  }
+
+  /**
+   * Verifies that omitting {@code headers} on the supplied {@link HttpOptions} is treated as no
+   * extra headers, not as an NPE.
+   */
+  @Test
+  public void constructor_missingHeaders_isTreatedAsEmpty() throws Exception {
+    ChatCompletionsHttpClient clientWithoutHeaders =
+        new ChatCompletionsHttpClient(
+            HttpOptions.builder().baseUrl("https://example.com/").build());
+    swapInMockHttpClient(clientWithoutHeaders);
+
+    String responseBody =
+        """
+        {"choices":[{"message":{"role":"assistant","content":"Hi"},"finish_reason":"stop"}]}
+        """;
+    Response mockResponse = createMockResponse(responseBody, JSON);
+
+    ArgumentCaptor<Callback> callbackCaptor = ArgumentCaptor.forClass(Callback.class);
+    doNothing().when(mockCall).enqueue(callbackCaptor.capture());
+
+    TestSubscriber<LlmResponse> testSubscriber =
+        clientWithoutHeaders.complete(minimalRequest(), false).test();
+
+    callbackCaptor.getValue().onResponse(mockCall, mockResponse);
+    testSubscriber.await(AWAIT_TIMEOUT.toMillis(), MILLISECONDS);
+
+    testSubscriber.assertNoErrors();
+    testSubscriber.assertValueCount(1);
+  }
+
+  /** Verifies that a {@code null} {@link HttpOptions} is rejected at construction time. */
+  @Test
+  public void constructor_nullHttpOptions_throws() {
+    assertThrows(NullPointerException.class, () -> new ChatCompletionsHttpClient(null));
+  }
+
+  /**
+   * Verifies that an {@link HttpOptions} without a {@code baseUrl} is rejected at construction time
+   * as bad configuration. {@link IllegalArgumentException} (not NPE) is the conventional signal for
+   * missing required configuration.
+   */
+  @Test
+  public void constructor_missingBaseUrl_throws() {
+    HttpOptions noBaseUrl = HttpOptions.builder().build();
+    assertThrows(IllegalArgumentException.class, () -> new ChatCompletionsHttpClient(noBaseUrl));
+  }
+
+  /**
+   * Verifies that an {@link HttpOptions} with a malformed (non-HTTP(S)) {@code baseUrl} is rejected
+   * at construction time, rather than failing later at the first {@code complete()} call with a
+   * confusing NPE from {@link okhttp3.HttpUrl#parse}.
+   */
+  @Test
+  public void constructor_malformedBaseUrl_throws() {
+    HttpOptions malformed = HttpOptions.builder().baseUrl("not a url").build();
+    assertThrows(IllegalArgumentException.class, () -> new ChatCompletionsHttpClient(malformed));
+  }
+
+  // -- Tri-state timeout policy. ----------------------------------------------------------
+
+  /**
+   * Verifies that when {@code httpOptions} omits {@code timeout()}, the client applies the 5-minute
+   * default call timeout to prevent indefinite hangs in callers that did not explicitly configure a
+   * timeout.
+   */
+  @Test
+  public void constructor_missingTimeout_appliesDefaultFiveMinuteTimeout() {
+    ChatCompletionsHttpClient defaultClient =
+        new ChatCompletionsHttpClient(
+            HttpOptions.builder().baseUrl("https://example.com/").build());
+
+    OkHttpClient internal = readInternalClient(defaultClient);
+    assertThat(internal.callTimeoutMillis())
+        .isEqualTo((int) Duration.ofMinutes(5).toMillis()); // 300_000
+  }
+
+  /**
+   * Verifies that when the caller explicitly sets {@code httpOptions.timeout() == 0}, the client
+   * respects this as the explicit opt-in to infinite hang. This is the migration path for
+   * long-running streams or batch jobs that need no timeout.
+   */
+  @Test
+  public void constructor_zeroTimeout_respectsInfiniteHang() {
+    HttpOptions zeroTimeout =
+        HttpOptions.builder().baseUrl("https://example.com/").timeout(0).build();
+    ChatCompletionsHttpClient infiniteClient = new ChatCompletionsHttpClient(zeroTimeout);
+
+    OkHttpClient internal = readInternalClient(infiniteClient);
+    assertThat(internal.callTimeoutMillis()).isEqualTo(0); // OkHttp: 0 = no timeout
+  }
+
+  /**
+   * Verifies that when the caller sets a positive timeout, that value (in milliseconds) is used as
+   * the call timeout.
+   */
+  @Test
+  public void constructor_explicitTimeout_appliesIt() {
+    HttpOptions tenSeconds =
+        HttpOptions.builder().baseUrl("https://example.com/").timeout(10_000).build();
+    ChatCompletionsHttpClient timedClient = new ChatCompletionsHttpClient(tenSeconds);
+
+    OkHttpClient internal = readInternalClient(timedClient);
+    assertThat(internal.callTimeoutMillis()).isEqualTo(10_000);
+  }
+
+  /** Reflectively reads the internal {@link OkHttpClient} to inspect the resolved timeout. */
+  private static OkHttpClient readInternalClient(ChatCompletionsHttpClient target) {
+    try {
+      Field clientField = ChatCompletionsHttpClient.class.getDeclaredField("client");
+      clientField.setAccessible(true);
+      return (OkHttpClient) clientField.get(target);
+    } catch (ReflectiveOperationException e) {
+      throw new LinkageError("Failed to read internal client", e);
+    }
+  }
+}
diff --git a/dev/pom.xml b/dev/pom.xml
index bf89e7ca6..998c146e2 100644
--- a/dev/pom.xml
+++ b/dev/pom.xml
@@ -18,7 +18,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-parent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
   </parent>
 
   <artifactId>google-adk-dev</artifactId>
diff --git a/maven_plugin/examples/custom_tools/pom.xml b/maven_plugin/examples/custom_tools/pom.xml
index 38bc9b561..58538fbea 100644
--- a/maven_plugin/examples/custom_tools/pom.xml
+++ b/maven_plugin/examples/custom_tools/pom.xml
@@ -4,7 +4,7 @@
 
     <groupId>com.example</groupId>
     <artifactId>custom-tools-example</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <packaging>jar</packaging>
 
     <name>ADK Custom Tools Example</name>
diff --git a/maven_plugin/examples/simple-agent/pom.xml b/maven_plugin/examples/simple-agent/pom.xml
index c713f525d..03cfce1cb 100644
--- a/maven_plugin/examples/simple-agent/pom.xml
+++ b/maven_plugin/examples/simple-agent/pom.xml
@@ -4,7 +4,7 @@
 
     <groupId>com.example</groupId>
     <artifactId>simple-adk-agent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <packaging>jar</packaging>
 
     <name>Simple ADK Agent Example</name>
diff --git a/maven_plugin/pom.xml b/maven_plugin/pom.xml
index f87df835d..500329f03 100644
--- a/maven_plugin/pom.xml
+++ b/maven_plugin/pom.xml
@@ -5,7 +5,7 @@
     <parent>
         <groupId>com.google.adk</groupId>
         <artifactId>google-adk-parent</artifactId>
-        <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+        <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
         <relativePath>../pom.xml</relativePath>
     </parent>
 
diff --git a/pom.xml b/pom.xml
index 73e0ccbaa..665b696a0 100644
--- a/pom.xml
+++ b/pom.xml
@@ -17,7 +17,7 @@
 
   <groupId>com.google.adk</groupId>
   <artifactId>google-adk-parent</artifactId>
-  <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+  <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
   <packaging>pom</packaging>
 
   <name>Google Agent Development Kit Maven Parent POM</name>
@@ -55,7 +55,7 @@
     <google.genai.version>1.44.0</google.genai.version>
     <protobuf.version>4.33.5</protobuf.version>
     <junit.version>5.11.4</junit.version>
-    <mockito.version>5.20.0</mockito.version>
+    <mockito.version>5.23.0</mockito.version>
     <java-websocket.version>1.6.0</java-websocket.version>
     <jackson.version>2.20.2</jackson.version>
     <okhttp.version>5.3.2</okhttp.version>
@@ -73,7 +73,7 @@
     <assertj.version>3.27.7</assertj.version>
     <anthropic.version>2.15.0</anthropic.version>
     <maven-plugin-tools.version>3.9.0</maven-plugin-tools.version>
-    <httpclient5.version>5.6</httpclient5.version>
+    <httpclient5.version>5.6.1</httpclient5.version>
     <netty.version>4.1.118.Final</netty.version>
     <surefire.argLine>@{jacoco.agent.argLine} --add-opens=java.base/java.nio=ALL-UNNAMED --add-opens=java.base/sun.nio.ch=ALL-UNNAMED --add-opens=java.base/java.util.concurrent=ALL-UNNAMED --add-opens=java.base/java.text=ALL-UNNAMED --add-opens=java.base/java.util=ALL-UNNAMED --add-opens=java.base/java.lang=ALL-UNNAMED --add-opens=java.base/java.lang.reflect=ALL-UNNAMED --add-opens=java.base/jdk.internal.misc=ALL-UNNAMED -Dio.netty.tryReflectionSetAccessible=true</surefire.argLine>
   </properties>
@@ -454,7 +454,7 @@
       <plugin>
         <groupId>org.jacoco</groupId>
         <artifactId>jacoco-maven-plugin</artifactId>
-        <version>0.8.12</version>
+        <version>0.8.14</version>
         <executions>
           <execution>
             <goals>
diff --git a/tutorials/city-time-weather/pom.xml b/tutorials/city-time-weather/pom.xml
index f63dc96a8..5a559d7a4 100644
--- a/tutorials/city-time-weather/pom.xml
+++ b/tutorials/city-time-weather/pom.xml
@@ -20,7 +20,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-parent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <relativePath>../../pom.xml</relativePath>
   </parent>
 
diff --git a/tutorials/live-audio-single-agent/pom.xml b/tutorials/live-audio-single-agent/pom.xml
index 3c4475b6a..764289fcb 100644
--- a/tutorials/live-audio-single-agent/pom.xml
+++ b/tutorials/live-audio-single-agent/pom.xml
@@ -20,7 +20,7 @@
   <parent>
     <groupId>com.google.adk</groupId>
     <artifactId>google-adk-parent</artifactId>
-    <version>1.2.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
+    <version>1.3.1-SNAPSHOT</version><!-- {x-version-update:google-adk:current} -->
     <relativePath>../../pom.xml</relativePath>
   </parent>