diff --git a/dubbo-rpc/dubbo-rpc-api/src/main/java/org/apache/dubbo/rpc/AdaptiveMetrics.java b/dubbo-rpc/dubbo-rpc-api/src/main/java/org/apache/dubbo/rpc/AdaptiveMetrics.java
index dfd077f947a..4627c6b8774 100644
--- a/dubbo-rpc/dubbo-rpc-api/src/main/java/org/apache/dubbo/rpc/AdaptiveMetrics.java
+++ b/dubbo-rpc/dubbo-rpc-api/src/main/java/org/apache/dubbo/rpc/AdaptiveMetrics.java
@@ -46,6 +46,14 @@ public class AdaptiveMetrics {
     private final AtomicLong errorReq = new AtomicLong();
     private double ewma = 0;
 
+    // Coalescing freshness signal: set by setProviderMetrics(), cleared by getLoad().
+    // Indicates whether new provider metrics have arrived since the last getLoad() call.
+    // volatile for cross-thread visibility (setProviderMetrics runs in async executor,
+    // getLoad runs in caller thread). Not an event counter — intermediate updates are
+    // coalesced, which is acceptable because lastLatency and ewma are already updated
+    // to the latest values in setProviderMetrics().
+    private volatile boolean providerUpdated = false;
+
     public double getLoad(String idKey, int weight, int timeout) {
         AdaptiveMetrics metrics = getStatus(idKey);
 
@@ -57,11 +65,13 @@ public double getLoad(String idKey, int weight, int timeout) {
         if (metrics.currentTime > 0) {
             long multiple = (System.currentTimeMillis() - metrics.currentTime) / timeout + 1;
             if (multiple > 0) {
-                if (metrics.currentProviderTime == metrics.currentTime) {
-                    // penalty value
-                    metrics.lastLatency = timeout * 2L;
+                if (metrics.providerUpdated) {
+                    // Fresh metrics arrived — use real lastLatency (already set by setProviderMetrics)
+                    metrics.providerUpdated = false;
                 } else {
-                    metrics.lastLatency = metrics.lastLatency >> multiple;
+                    // No fresh metrics — decay with floor to prevent collapse to zero
+                    long floor = Math.max(1L, timeout / 100L);
+                    metrics.lastLatency = Math.max(floor, metrics.lastLatency >> multiple);
                 }
                 metrics.ewma = metrics.beta * metrics.ewma + (1 - metrics.beta) * metrics.lastLatency;
                 metrics.currentTime = System.currentTimeMillis();
@@ -123,5 +133,6 @@ public void setProviderMetrics(String idKey, Map<String, String> metricsMap) {
         metrics.beta = 0.5;
         // Vt =  β * Vt-1 + (1 -  β ) * θt
         metrics.ewma = metrics.beta * metrics.ewma + (1 - metrics.beta) * metrics.lastLatency;
+        metrics.providerUpdated = true;
     }
 }
diff --git a/dubbo-rpc/dubbo-rpc-api/src/test/java/org/apache/dubbo/rpc/AdaptiveMetricsTest.java b/dubbo-rpc/dubbo-rpc-api/src/test/java/org/apache/dubbo/rpc/AdaptiveMetricsTest.java
new file mode 100644
index 00000000000..b024a538fc0
--- /dev/null
+++ b/dubbo-rpc/dubbo-rpc-api/src/test/java/org/apache/dubbo/rpc/AdaptiveMetricsTest.java
@@ -0,0 +1,240 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.dubbo.rpc;
+
+import java.util.HashMap;
+import java.util.Map;
+
+import org.junit.jupiter.api.Test;
+
+import static org.junit.jupiter.api.Assertions.assertEquals;
+import static org.junit.jupiter.api.Assertions.assertTrue;
+
+/**
+ * Unit tests for {@link AdaptiveMetrics}.
+ *
+ * <p>All tests drive through the public API only (no reflection, no Thread.sleep).
+ * Verifies the fix for <a href="https://github.com/apache/dubbo/issues/15810">#15810</a>:
+ * <ul>
+ *   <li>Bug 1: penalty branch overwrites real RT on every normal response</li>
+ *   <li>Bug 2: aggressive bit-shift decay collapses latency to zero</li>
+ * </ul>
+ */
+class AdaptiveMetricsTest {
+
+    private static final String FAST_KEY = "10.0.0.1:20880/com.example.TestService";
+    private static final String SLOW_KEY = "10.0.0.2:20880/com.example.TestService";
+    private static final String MEDIUM_KEY = "10.0.0.3:20880/com.example.TestService";
+    private static final int WEIGHT = 100;
+    private static final int TIMEOUT = 100;
+
+    private Map<String, String> metricsMap(long curTime, long rt, String load) {
+        Map<String, String> map = new HashMap<>();
+        map.put("curTime", String.valueOf(curTime));
+        map.put("rt", String.valueOf(rt));
+        map.put("load", load);
+        return map;
+    }
+
+    /**
+     * Bug 1 core regression: simulate the real request cycle where each
+     * setProviderMetrics() is immediately followed by a getLoad() call.
+     * This is the exact path that triggers the penalty bug on main branch.
+     *
+     * <p>With the bug: penalty overwrites all RTs to timeout*2, so after
+     * 20 rounds fast(10ms) EWMA ≈ 137 and slow(200ms) EWMA ≈ 200, ratio < 1.5x.
+     * With the fix: fast EWMA stays near 10, slow near 200, ratio > 5x.
+     */
+    @Test
+    void freshMetrics_usesRealLatency_notPenalty() {
+        AdaptiveMetrics am = new AdaptiveMetrics();
+
+        // 20 rounds: each round = setProviderMetrics + immediate getLoad (the bug path)
+        double fastLoad = 0;
+        double slowLoad = 0;
+        for (int i = 0; i < 20; i++) {
+            long now = System.currentTimeMillis();
+
+            am.addConsumerReq(FAST_KEY);
+            am.setProviderMetrics(FAST_KEY, metricsMap(now, 10, "0.5"));
+            am.addConsumerSuccess(FAST_KEY);
+            fastLoad = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+            am.addConsumerReq(SLOW_KEY);
+            am.setProviderMetrics(SLOW_KEY, metricsMap(now, 200, "0.5"));
+            am.addConsumerSuccess(SLOW_KEY);
+            slowLoad = am.getLoad(SLOW_KEY, WEIGHT, TIMEOUT);
+        }
+
+        // Strong assertion: the ratio must be > 2x.
+        // With penalty bug: ratio ≈ 1.46 (136.7 vs 200.0 EWMA). Fails.
+        // With fix: ratio ≈ 20x (10 vs 200 EWMA). Passes easily.
+        assertTrue(fastLoad > 0, "fastLoad should be > 0");
+        assertTrue(
+                slowLoad / fastLoad > 2.0,
+                "Slow/fast load ratio should be > 2x to prove real RT is used, "
+                        + "got ratio=" + (slowLoad / fastLoad)
+                        + " (fast=" + fastLoad + " slow=" + slowLoad + ")");
+    }
+
+    /**
+     * Bug 2 regression: after multiple decay rounds without new provider metrics,
+     * load must remain above zero. Decay-to-zero would make idle servers appear
+     * "fastest" and attract all traffic.
+     */
+    @Test
+    void decayWithoutUpdate_doesNotReachZero() {
+        AdaptiveMetrics am = new AdaptiveMetrics();
+        long now = System.currentTimeMillis();
+
+        am.addConsumerReq(FAST_KEY);
+        am.setProviderMetrics(FAST_KEY, metricsMap(now, 200, "0.5"));
+        am.addConsumerSuccess(FAST_KEY);
+
+        // First getLoad consumes the providerUpdated flag
+        am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+        // Multiple getLoad calls without new metrics — all enter decay branch
+        double load = 0;
+        for (int i = 0; i < 50; i++) {
+            load = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+        }
+
+        // With the bug: lastLatency >> large_multiple = 0, ewma -> 0, load -> 0
+        assertTrue(load > 0, "Load should not decay to zero after idle period, got " + load);
+    }
+
+    /**
+     * End-to-end: with 3 servers at different RTs, simulate the real request
+     * cycle (setProviderMetrics + getLoad each round). After 20 rounds the
+     * ordering must be strictly fast < medium < slow.
+     */
+    @Test
+    void multipleServers_fastServerPreferred() {
+        AdaptiveMetrics am = new AdaptiveMetrics();
+
+        double loadFast = 0;
+        double loadMedium = 0;
+        double loadSlow = 0;
+
+        // Each round: report metrics then immediately call getLoad (the real path)
+        for (int round = 0; round < 20; round++) {
+            long now = System.currentTimeMillis();
+
+            am.addConsumerReq(FAST_KEY);
+            am.setProviderMetrics(FAST_KEY, metricsMap(now, 10, "0.5"));
+            am.addConsumerSuccess(FAST_KEY);
+            loadFast = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+            am.addConsumerReq(MEDIUM_KEY);
+            am.setProviderMetrics(MEDIUM_KEY, metricsMap(now, 50, "0.5"));
+            am.addConsumerSuccess(MEDIUM_KEY);
+            loadMedium = am.getLoad(MEDIUM_KEY, WEIGHT, TIMEOUT);
+
+            am.addConsumerReq(SLOW_KEY);
+            am.setProviderMetrics(SLOW_KEY, metricsMap(now, 200, "0.5"));
+            am.addConsumerSuccess(SLOW_KEY);
+            loadSlow = am.getLoad(SLOW_KEY, WEIGHT, TIMEOUT);
+        }
+
+        // Strict ordering: fast < medium < slow
+        assertTrue(loadFast < loadMedium, "fast(" + loadFast + ") should be < medium(" + loadMedium + ")");
+        assertTrue(loadMedium < loadSlow, "medium(" + loadMedium + ") should be < slow(" + loadSlow + ")");
+    }
+
+    /**
+     * A server that degrades (RT jumps from 10ms to 500ms) should see its
+     * load score increase. CPU load is held constant to isolate the RT signal.
+     */
+    @Test
+    void degradedServer_loadIncreases() {
+        AdaptiveMetrics am = new AdaptiveMetrics();
+
+        // Warm up with fast responses (CPU fixed at 0.5)
+        for (int i = 0; i < 10; i++) {
+            long now = System.currentTimeMillis();
+            am.addConsumerReq(FAST_KEY);
+            am.setProviderMetrics(FAST_KEY, metricsMap(now, 10, "0.5"));
+            am.addConsumerSuccess(FAST_KEY);
+            am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+        }
+        double loadBefore = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+        // Server degrades: RT jumps to 500ms, CPU stays at 0.5
+        for (int i = 0; i < 10; i++) {
+            long now = System.currentTimeMillis();
+            am.addConsumerReq(FAST_KEY);
+            am.setProviderMetrics(FAST_KEY, metricsMap(now, 500, "0.5"));
+            am.addConsumerSuccess(FAST_KEY);
+            am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+        }
+        double loadAfter = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+        assertTrue(
+                loadAfter > loadBefore,
+                "Load should increase after RT degradation (CPU held constant): " + "before=" + loadBefore + " after="
+                        + loadAfter);
+    }
+
+    /**
+     * Guard: out-of-order serviceTime should be discarded by setProviderMetrics.
+     * An older timestamp must not overwrite newer metrics.
+     */
+    @Test
+    void outOfOrderServiceTime_isDiscarded() {
+        AdaptiveMetrics am = new AdaptiveMetrics();
+        long now = System.currentTimeMillis();
+
+        // Set metrics with current time, RT=50ms
+        am.addConsumerReq(FAST_KEY);
+        am.setProviderMetrics(FAST_KEY, metricsMap(now, 50, "0.5"));
+        am.addConsumerSuccess(FAST_KEY);
+        double loadAfterFresh = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+        // Attempt to set metrics with an older timestamp, RT=999ms
+        am.addConsumerReq(FAST_KEY);
+        am.setProviderMetrics(FAST_KEY, metricsMap(now - 10000, 999, "1.0"));
+        am.addConsumerSuccess(FAST_KEY);
+        double loadAfterStale = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+
+        // The stale update should have been discarded — load should not spike
+        assertTrue(
+                loadAfterStale <= loadAfterFresh,
+                "Stale metrics should be discarded: loadAfterFresh=" + loadAfterFresh + " loadAfterStale="
+                        + loadAfterStale);
+    }
+
+    /**
+     * Guard: when pickTime exceeds timeout * 2, getLoad must return 0 (forced pick)
+     * to prevent starvation. This behavior must not be broken by the fix.
+     */
+    @Test
+    void forcedPick_notBroken() {
+        AdaptiveMetrics am = new AdaptiveMetrics();
+        long now = System.currentTimeMillis();
+
+        am.addConsumerReq(FAST_KEY);
+        am.setProviderMetrics(FAST_KEY, metricsMap(now, 50, "0.5"));
+        am.addConsumerSuccess(FAST_KEY);
+
+        // Set pickTime far in the past -> triggers forced pick (return 0)
+        am.setPickTime(FAST_KEY, now - TIMEOUT * 3);
+
+        double load = am.getLoad(FAST_KEY, WEIGHT, TIMEOUT);
+        assertEquals(0.0, load, "getLoad should return 0 when pickTime exceeds timeout * 2");
+    }
+}