From 247b4ed4c04314c10f9e32c81c6dea73b0398dc2 Mon Sep 17 00:00:00 2001
From: 761417898 <761417898@qq.com>
Date: Thu, 30 Apr 2026 15:07:24 +0800
Subject: [PATCH 1/5] Fix TS_2DIFF float/double page compatibility and harden
 gtest zip validation.

Align C++ float/double TS_2DIFF flush/read behavior with Java overflow-page layout, and prevent 0-byte/corrupt googletest archives from being treated as successful downloads during test configuration.
---
 cpp/src/common/allocator/byte_stream.h  |  15 +++
 cpp/src/encoding/ts2diff_decoder.h      |  54 ++++++++++
 cpp/src/encoding/ts2diff_encoder.h      | 130 ++++++++++++++++++++++++
 cpp/test/CMakeLists.txt                 |  73 ++++++++++---
 cpp/test/encoding/ts2diff_codec_test.cc |  77 ++++++++++++++
 5 files changed, 336 insertions(+), 13 deletions(-)
diff --git a/cpp/src/common/allocator/byte_stream.h b/cpp/src/common/allocator/byte_stream.h
index 6d08744c3..dddc00b81 100644
--- a/cpp/src/common/allocator/byte_stream.h
+++ b/cpp/src/common/allocator/byte_stream.h
@@ -347,6 +347,21 @@ class ByteStream {
 
     FORCE_INLINE uint32_t total_size() const { return total_size_.load(); }
     FORCE_INLINE uint32_t read_pos() const { return read_pos_; };
+    /**
+     * Seek the read cursor to an absolute offset. Re-anchors read_page_ for
+     * multi-page streams.
+     */
+    void set_read_pos(uint32_t pos) {
+        ASSERT(pos <= total_size());
+        read_pos_ = pos;
+        Page* p = head_.load();
+        uint32_t skipped = 0;
+        while (p != nullptr && skipped + page_size_ <= pos) {
+            skipped += page_size_;
+            p = p->next_.load();
+        }
+        read_page_ = p;
+    }
     FORCE_INLINE void wrapped_buf_advance_read_pos(uint32_t size) {
         if (size + read_pos_ > total_size_.load()) {
             read_pos_ = total_size_.load();
diff --git a/cpp/src/encoding/ts2diff_decoder.h b/cpp/src/encoding/ts2diff_decoder.h
index 32584546d..258f04337 100644
--- a/cpp/src/encoding/ts2diff_decoder.h
+++ b/cpp/src/encoding/ts2diff_decoder.h
@@ -30,6 +30,43 @@
 #include "utils/util_define.h"
 
 namespace storage {
+
+namespace ts2diff_java_detail {
+
+// Java FloatEncoder overflow flush uses Integer.MAX_VALUE - 1; FloatDecoder
+// then reads BitMaps and Float.intBitsToFloat for float/double TS_2DIFF pages.
+constexpr uint32_t kJavaFloatTs2DiffOverflowMagic =
+    2147483646u;  // Integer.MAX_VALUE - 1
+
+inline int consume_float_double_ts2diff_prefix(common::ByteStream& in) {
+    int ret = common::E_OK;
+    uint32_t mark = in.read_pos();
+    uint32_t tag = 0;
+    if (RET_FAIL(common::SerializationUtil::read_var_uint(tag, in))) {
+        return ret;
+    }
+    if (tag == kJavaFloatTs2DiffOverflowMagic) {
+        uint32_t n = 0;
+        if (RET_FAIL(common::SerializationUtil::read_var_uint(n, in))) {
+            return ret;
+        }
+        int bm_len = static_cast<int>(n) / 8 + 1;
+        uint32_t skip_to = in.read_pos() + static_cast<uint32_t>(bm_len * 2);
+        in.set_read_pos(skip_to);
+        uint32_t inner_max_point = 0;
+        if (RET_FAIL(common::SerializationUtil::read_var_uint(inner_max_point,
+                                                              in))) {
+            return ret;
+        }
+        (void)inner_max_point;
+    } else {
+        in.set_read_pos(mark);
+    }
+    return common::E_OK;
+}
+
+}  // namespace ts2diff_java_detail
+
 template <typename T>
 class TS2DIFFDecoder : public Decoder {
    public:
@@ -295,6 +332,16 @@ FORCE_INLINE int FloatTS2DIFFDecoder::read_int64(int64_t& ret_value,
 }
 FORCE_INLINE int FloatTS2DIFFDecoder::read_float(float& ret_value,
                                                  common::ByteStream& in) {
+    int ret = common::E_OK;
+    // Each encoder flush() emits a self-contained Java-compatible segment.
+    // TS_2DIFFDecoder resets current_index_ to 0 at block boundaries; align
+    // the outer FloatEncoder wrapper before reading each new inner block.
+    if (current_index_ == 0) {
+        if (RET_FAIL(
+                ts2diff_java_detail::consume_float_double_ts2diff_prefix(in))) {
+            return ret;
+        }
+    }
     ret_value = decode(in);
     return common::E_OK;
 }
@@ -325,6 +372,13 @@ FORCE_INLINE int DoubleTS2DIFFDecoder::read_float(float& ret_value,
 }
 FORCE_INLINE int DoubleTS2DIFFDecoder::read_double(double& ret_value,
                                                    common::ByteStream& in) {
+    int ret = common::E_OK;
+    if (current_index_ == 0) {
+        if (RET_FAIL(
+                ts2diff_java_detail::consume_float_double_ts2diff_prefix(in))) {
+            return ret;
+        }
+    }
     ret_value = decode(in);
     return common::E_OK;
 }
diff --git a/cpp/src/encoding/ts2diff_encoder.h b/cpp/src/encoding/ts2diff_encoder.h
index 8c5ddafc7..bd51d2cc9 100644
--- a/cpp/src/encoding/ts2diff_encoder.h
+++ b/cpp/src/encoding/ts2diff_encoder.h
@@ -22,6 +22,8 @@
 
 #include <sys/types.h>
 
+#include <vector>
+
 #include "common/allocator/alloc_base.h"
 #include "common/allocator/byte_stream.h"
 #include "encoder.h"
@@ -275,6 +277,7 @@ class FloatTS2DIFFEncoder : public TS2DIFFEncoder<int32_t> {
         int32_t value_int = common::float_to_int(value);
         return TS2DIFFEncoder<int32_t>::do_encode(value_int, out_stream);
     }
+    int flush(common::ByteStream& out_stream) override;
     int encode(bool value, common::ByteStream& out_stream);
     int encode(int32_t value, common::ByteStream& out_stream);
     int encode(int64_t value, common::ByteStream& out_stream);
@@ -288,6 +291,7 @@ class DoubleTS2DIFFEncoder : public TS2DIFFEncoder<int64_t> {
         int64_t value_long = common::double_to_long(value);
         return TS2DIFFEncoder<int64_t>::do_encode(value_long, out_stream);
     }
+    int flush(common::ByteStream& out_stream) override;
     int encode(bool value, common::ByteStream& out_stream);
     int encode(int32_t value, common::ByteStream& out_stream);
     int encode(int64_t value, common::ByteStream& out_stream);
@@ -402,5 +406,131 @@ FORCE_INLINE int DoubleTS2DIFFEncoder::encode(double value,
     return do_encode(value, out);
 }
 
+// Align with Java FloatEncoder TS_2DIFF page layout (overflow flush): outer
+// header + BitMaps so FloatDecoder uses Float.intBitsToFloat on every value
+// (C++ stores IEEE float bits, not scaled decimals).
+FORCE_INLINE int FloatTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
+    int ret = common::E_OK;
+    if (write_index_ == -1) {
+        return common::E_OK;
+    }
+    const int num_values = write_index_ + 1;
+    common::ByteStream inner(1024, common::MOD_TS2DIFF_OBJ, false);
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(0u, inner))) {
+        return ret;
+    }
+    SIMDOps<int32_t>::rebase(delta_arr_, delta_arr_min_, write_index_);
+    int bit_width = cal_bit_width(delta_arr_max_ - delta_arr_min_);
+    if (RET_FAIL(common::SerializationUtil::write_ui32(
+            static_cast<uint32_t>(write_index_), inner))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_ui32(
+            static_cast<uint32_t>(bit_width), inner))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_ui32(
+            static_cast<uint32_t>(delta_arr_min_), inner))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_ui32(
+            static_cast<uint32_t>(first_value_), inner))) {
+        return ret;
+    }
+    for (int i = 0; i < write_index_; i++) {
+        write_bits(delta_arr_[i], bit_width, inner);
+    }
+    flush_remaining(inner);
+    reset();
+
+    constexpr uint32_t kJavaFloatTs2DiffOverflowMagic =
+        2147483646u;  // Java Integer.MAX_VALUE - 1
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(
+            kJavaFloatTs2DiffOverflowMagic, out_stream))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(
+            static_cast<uint32_t>(num_values), out_stream))) {
+        return ret;
+    }
+    int bm_len = num_values / 8 + 1;
+    std::vector<uint8_t> under(static_cast<size_t>(bm_len), 0);
+    std::vector<uint8_t> over(static_cast<size_t>(bm_len), 0);
+    for (int i = 0; i < num_values; i++) {
+        over[static_cast<size_t>(i / 8)] |= static_cast<uint8_t>(1u << (i % 8));
+    }
+    if (RET_FAIL(out_stream.write_buf(under.data(),
+                                      static_cast<uint32_t>(bm_len)))) {
+        return ret;
+    }
+    if (RET_FAIL(
+            out_stream.write_buf(over.data(), static_cast<uint32_t>(bm_len)))) {
+        return ret;
+    }
+    if (RET_FAIL(merge_byte_stream(out_stream, inner, true))) {
+        return ret;
+    }
+    return ret;
+}
+
+FORCE_INLINE int DoubleTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
+    int ret = common::E_OK;
+    if (write_index_ == -1) {
+        return common::E_OK;
+    }
+    const int num_values = write_index_ + 1;
+    common::ByteStream inner(1024, common::MOD_TS2DIFF_OBJ, false);
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(0u, inner))) {
+        return ret;
+    }
+    SIMDOps<int64_t>::rebase(delta_arr_, delta_arr_min_, write_index_);
+    int bit_width = cal_bit_width(delta_arr_max_ - delta_arr_min_);
+    if (RET_FAIL(common::SerializationUtil::write_i32(write_index_, inner))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_i32(bit_width, inner))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_i64(delta_arr_min_, inner))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_i64(first_value_, inner))) {
+        return ret;
+    }
+    for (int i = 0; i < write_index_; i++) {
+        write_bits(delta_arr_[i], bit_width, inner);
+    }
+    flush_remaining(inner);
+    reset();
+
+    constexpr uint32_t kJavaFloatTs2DiffOverflowMagic = 2147483646u;
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(
+            kJavaFloatTs2DiffOverflowMagic, out_stream))) {
+        return ret;
+    }
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(
+            static_cast<uint32_t>(num_values), out_stream))) {
+        return ret;
+    }
+    int bm_len = num_values / 8 + 1;
+    std::vector<uint8_t> under(static_cast<size_t>(bm_len), 0);
+    std::vector<uint8_t> over(static_cast<size_t>(bm_len), 0);
+    for (int i = 0; i < num_values; i++) {
+        over[static_cast<size_t>(i / 8)] |= static_cast<uint8_t>(1u << (i % 8));
+    }
+    if (RET_FAIL(out_stream.write_buf(under.data(),
+                                      static_cast<uint32_t>(bm_len)))) {
+        return ret;
+    }
+    if (RET_FAIL(
+            out_stream.write_buf(over.data(), static_cast<uint32_t>(bm_len)))) {
+        return ret;
+    }
+    if (RET_FAIL(merge_byte_stream(out_stream, inner, true))) {
+        return ret;
+    }
+    return ret;
+}
+
 }  // end namespace storage
 #endif  // ENCODING_TS2DIFF_ENCODER_H
diff --git a/cpp/test/CMakeLists.txt b/cpp/test/CMakeLists.txt
index 2be9c1b2c..9b84bf883 100644
--- a/cpp/test/CMakeLists.txt
+++ b/cpp/test/CMakeLists.txt
@@ -18,7 +18,6 @@ under the License.
 ]]
 cmake_minimum_required(VERSION 3.11)
 project(TsFile_CPP_TEST)
-include(FetchContent)
 
 set(CMAKE_VERBOSE_MAKEFILE ON)
 
@@ -33,36 +32,84 @@ set(DOWNLOADED 0)
 set(GTEST_URL "")
 set(TIMEOUT 30)
 
-if (EXISTS ${GTEST_ZIP_PATH})
+# Treat only a real ZIP as valid (local header magic PK\x03\x04 -> hex 504b0304).
+# EXISTS alone is wrong: failed downloads often leave a 0-byte file.
+# Do not use plain file(READ)+string LENGTH on binary: CMake may report length > LIMIT.
+set(GTEST_ZIP_LOCAL_VALID 0)
+if (EXISTS "${GTEST_ZIP_PATH}")
+    file(READ "${GTEST_ZIP_PATH}" GTEST_ZIP_HEX_PROBE LIMIT 4 HEX)
+    string(STRIP "${GTEST_ZIP_HEX_PROBE}" GTEST_ZIP_HEX_PROBE)
+    string(TOLOWER "${GTEST_ZIP_HEX_PROBE}" GTEST_ZIP_HEX_PROBE)
+    if (GTEST_ZIP_HEX_PROBE MATCHES "^504b03")
+        set(GTEST_ZIP_LOCAL_VALID 1)
+    else ()
+        message(
+                WARNING
+                "Local googletest zip is empty or not a zip (${GTEST_ZIP_PATH}); "
+                "will try download."
+        )
+        file(REMOVE "${GTEST_ZIP_PATH}")
+    endif ()
+endif ()
+
+if (GTEST_ZIP_LOCAL_VALID)
     message(STATUS "Using local gtest zip file: ${GTEST_ZIP_PATH}")
     set(DOWNLOADED 1)
     set(GTEST_URL ${GTEST_ZIP_PATH})
 else ()
-    message(STATUS "Local gtest zip file not found, trying to download from network...")
+    message(STATUS "Local gtest zip missing or invalid, trying to download from network...")
 endif ()
 
 if (NOT DOWNLOADED)
     foreach (URL ${GTEST_URL_LIST})
         message(STATUS "Trying to download from ${URL}")
-        file(DOWNLOAD ${URL} "${CMAKE_SOURCE_DIR}/third_party/googletest-release-1.12.1.zip" STATUS DOWNLOAD_STATUS TIMEOUT ${TIMEOUT})
+        file(DOWNLOAD ${URL} "${GTEST_ZIP_PATH}" STATUS DOWNLOAD_STATUS TIMEOUT
+                ${TIMEOUT})
 
         list(GET DOWNLOAD_STATUS 0 DOWNLOAD_RESULT)
-        if (${DOWNLOAD_RESULT} EQUAL 0)
-            set(DOWNLOADED 1)
-            set(GTEST_URL ${GTEST_ZIP_PATH})
-            break()
+        if (${DOWNLOAD_RESULT} EQUAL 0 AND EXISTS "${GTEST_ZIP_PATH}")
+            file(READ "${GTEST_ZIP_PATH}" GTEST_ZIP_HEX_PROBE LIMIT 4 HEX)
+            string(STRIP "${GTEST_ZIP_HEX_PROBE}" GTEST_ZIP_HEX_PROBE)
+            string(TOLOWER "${GTEST_ZIP_HEX_PROBE}" GTEST_ZIP_HEX_PROBE)
+            if (GTEST_ZIP_HEX_PROBE MATCHES "^504b03")
+                set(DOWNLOADED 1)
+                set(GTEST_URL ${GTEST_ZIP_PATH})
+                break()
+            else ()
+                message(WARNING "Download from ${URL} did not yield a valid zip; trying next URL...")
+                file(REMOVE "${GTEST_ZIP_PATH}")
+            endif ()
         endif ()
     endforeach ()
 endif ()
 
 if (${DOWNLOADED})
     message(STATUS "Successfully get googletest from ${GTEST_URL}")
-    FetchContent_Declare(
-            googletest
-            URL ${GTEST_URL}
-    )
     set(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
-    FetchContent_MakeAvailable(googletest)
+    # Extract GitHub release zip via CMake (top folder googletest-release-1.12.1/).
+    # Avoid FetchContent here: deferred populate / wrong extract dir broke configure.
+    set(_gtest_stage "${CMAKE_BINARY_DIR}/googletest-extract")
+    set(GTEST_SRC_ROOT "${_gtest_stage}/googletest-release-1.12.1")
+    if (NOT EXISTS "${GTEST_SRC_ROOT}/CMakeLists.txt")
+        file(REMOVE_RECURSE "${_gtest_stage}")
+        file(MAKE_DIRECTORY "${_gtest_stage}")
+        execute_process(
+                COMMAND ${CMAKE_COMMAND} -E tar xf "${GTEST_ZIP_PATH}"
+                WORKING_DIRECTORY "${_gtest_stage}"
+                RESULT_VARIABLE _gtest_tar_result
+        )
+        if (NOT _gtest_tar_result EQUAL 0)
+            message(FATAL_ERROR "Failed to extract googletest zip: ${GTEST_ZIP_PATH}")
+        endif ()
+    endif ()
+    if (NOT EXISTS "${GTEST_SRC_ROOT}/CMakeLists.txt")
+        message(
+                FATAL_ERROR
+                "googletest zip layout unexpected (missing ${GTEST_SRC_ROOT}/CMakeLists.txt)."
+        )
+    endif ()
+    add_subdirectory("${GTEST_SRC_ROOT}" "${CMAKE_BINARY_DIR}/googletest-build"
+            EXCLUDE_FROM_ALL)
     set(TESTS_ENABLED ON PARENT_SCOPE)
 else ()
     message(WARNING "Failed to download googletest from all provided URLs, setting TESTS_ENABLED to OFF")
diff --git a/cpp/test/encoding/ts2diff_codec_test.cc b/cpp/test/encoding/ts2diff_codec_test.cc
index be16d4af2..bfa58b4e3 100644
--- a/cpp/test/encoding/ts2diff_codec_test.cc
+++ b/cpp/test/encoding/ts2diff_codec_test.cc
@@ -19,7 +19,10 @@
 #include <gtest/gtest.h>
 
 #include <bitset>
+#include <chrono>
+#include <cstring>
 #include <random>
+#include <vector>
 
 #include "encoding/ts2diff_decoder.h"
 #include "encoding/ts2diff_encoder.h"
@@ -59,6 +62,80 @@ class TS2DIFFCodecTest : public ::testing::Test {
     LongTS2DIFFDecoder* decoder_long_;
 };
 
+// Float/double TS_2DIFF: page layout must match Java FloatEncoder (overflow
+// flush) so cross-language readers see Float.intBitsToFloat values.
+class FloatDoubleTS2DIFFCodecTest : public ::testing::Test {
+   protected:
+    void SetUp() override {
+        encoder_float_ = new FloatTS2DIFFEncoder();
+        decoder_float_ = new FloatTS2DIFFDecoder();
+        encoder_double_ = new DoubleTS2DIFFEncoder();
+        decoder_double_ = new DoubleTS2DIFFDecoder();
+    }
+
+    void TearDown() override {
+        if (encoder_float_ != nullptr) {
+            encoder_float_->destroy();
+            delete encoder_float_;
+            encoder_float_ = nullptr;
+        }
+        if (encoder_double_ != nullptr) {
+            encoder_double_->destroy();
+            delete encoder_double_;
+            encoder_double_ = nullptr;
+        }
+        delete decoder_float_;
+        decoder_float_ = nullptr;
+        delete decoder_double_;
+        decoder_double_ = nullptr;
+    }
+
+    FloatTS2DIFFEncoder* encoder_float_{nullptr};
+    DoubleTS2DIFFEncoder* encoder_double_{nullptr};
+    FloatTS2DIFFDecoder* decoder_float_{nullptr};
+    DoubleTS2DIFFDecoder* decoder_double_{nullptr};
+};
+
+TEST_F(FloatDoubleTS2DIFFCodecTest, TestFloatRoundTrip) {
+    common::ByteStream out_stream(1024, common::MOD_TS2DIFF_OBJ, false);
+    const int row_num = 1000;
+    std::vector<float> data(row_num);
+    for (int i = 0; i < row_num; i++) {
+        data[i] = static_cast<float>(i) * 0.125f + 0.25f;
+    }
+    for (int i = 0; i < row_num; i++) {
+        EXPECT_EQ(encoder_float_->encode(data[i], out_stream), common::E_OK);
+    }
+    EXPECT_EQ(encoder_float_->flush(out_stream), common::E_OK);
+
+    float x = 0.f;
+    for (int i = 0; i < row_num; i++) {
+        EXPECT_EQ(decoder_float_->read_float(x, out_stream), common::E_OK);
+        EXPECT_FLOAT_EQ(x, data[i]) << "row " << i;
+    }
+    EXPECT_FALSE(decoder_float_->has_remaining(out_stream));
+}
+
+TEST_F(FloatDoubleTS2DIFFCodecTest, TestDoubleRoundTrip) {
+    common::ByteStream out_stream(1024, common::MOD_TS2DIFF_OBJ, false);
+    const int row_num = 800;
+    std::vector<double> data(row_num);
+    for (int i = 0; i < row_num; i++) {
+        data[i] = static_cast<double>(i) * 0.0625 + 0.5;
+    }
+    for (int i = 0; i < row_num; i++) {
+        EXPECT_EQ(encoder_double_->encode(data[i], out_stream), common::E_OK);
+    }
+    EXPECT_EQ(encoder_double_->flush(out_stream), common::E_OK);
+
+    double y = 0.;
+    for (int i = 0; i < row_num; i++) {
+        EXPECT_EQ(decoder_double_->read_double(y, out_stream), common::E_OK);
+        EXPECT_DOUBLE_EQ(y, data[i]) << "row " << i;
+    }
+    EXPECT_FALSE(decoder_double_->has_remaining(out_stream));
+}
+
 TEST_F(TS2DIFFCodecTest, TestIntEncoding1) {
     common::ByteStream out_stream(1024, common::MOD_TS2DIFF_OBJ, false);
     const int row_num = 10000;

From b0a4f9eb2c38cf8b16008712c084b0c7d215a8b5 Mon Sep 17 00:00:00 2001
From: 761417898 <761417898@qq.com>
Date: Thu, 30 Apr 2026 15:44:11 +0800
Subject: [PATCH 2/5] Make tsfile-cpp optimization flags inherit from caller by
 default.

Add optional TSFILE_OPTIMIZATION_FLAGS overrides in project/examples CMake while removing hardcoded optimization settings so library builds follow common CMake integration behavior.
---
 cpp/CMakeLists.txt          | 30 ++++++++++++++++++------------
 cpp/examples/CMakeLists.txt | 10 ++++++++--
 cpp/examples/README.md      |  8 ++++++++
 3 files changed, 34 insertions(+), 14 deletions(-)

diff --git a/cpp/CMakeLists.txt b/cpp/CMakeLists.txt
index 3f1d8bdd3..c5b10b35e 100755
--- a/cpp/CMakeLists.txt
+++ b/cpp/CMakeLists.txt
@@ -83,15 +83,24 @@ else ()
 endif ()
 
 message("CMAKE BUILD TYPE " ${CMAKE_BUILD_TYPE})
-if (CMAKE_BUILD_TYPE STREQUAL "Debug")
-    set(CMAKE_CXX_FLAGS_DEBUG "${CMAKE_CXX_FLAGS_DEBUG} -O0 -g")
-elseif (CMAKE_BUILD_TYPE STREQUAL "Release")
-    set(CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -O2")
-elseif (CMAKE_BUILD_TYPE STREQUAL "RelWithDebInfo")
-    set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "${CMAKE_CXX_FLAGS_RELWITHDEBINFO} -O2 -g")
-elseif (CMAKE_BUILD_TYPE STREQUAL "MinSizeRel")
-    set(CMAKE_CXX_FLAGS_MINSIZEREL "${CMAKE_CXX_FLAGS_MINSIZEREL} -ffunction-sections -fdata-sections -Os")
-    set(CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -Wl,--gc-sections")
+# Keep optimization policy external by default (caller/toolchain/CMake defaults).
+set(TSFILE_OPTIMIZATION_FLAGS ""
+        CACHE STRING
+        "Optional extra optimization flags for tsfile-cpp (e.g. -O3). Empty means inherit caller defaults.")
+if (TSFILE_OPTIMIZATION_FLAGS)
+    # Apply after CMake defaults for each config so explicit optimization can
+    # override default -O flags in Release/RelWithDebInfo/Debug/MinSizeRel.
+    set(CMAKE_CXX_FLAGS_DEBUG
+            "${CMAKE_CXX_FLAGS_DEBUG} ${TSFILE_OPTIMIZATION_FLAGS}")
+    set(CMAKE_CXX_FLAGS_RELEASE
+            "${CMAKE_CXX_FLAGS_RELEASE} ${TSFILE_OPTIMIZATION_FLAGS}")
+    set(CMAKE_CXX_FLAGS_RELWITHDEBINFO
+            "${CMAKE_CXX_FLAGS_RELWITHDEBINFO} ${TSFILE_OPTIMIZATION_FLAGS}")
+    set(CMAKE_CXX_FLAGS_MINSIZEREL
+            "${CMAKE_CXX_FLAGS_MINSIZEREL} ${TSFILE_OPTIMIZATION_FLAGS}")
+    message("cmake using: TSFILE_OPTIMIZATION_FLAGS=${TSFILE_OPTIMIZATION_FLAGS}")
+else ()
+    message("cmake using: TSFILE_OPTIMIZATION_FLAGS=<inherit>")
 endif ()
 message("CMAKE DEBUG: CMAKE_CXX_FLAGS=${CMAKE_CXX_FLAGS}")
 
@@ -177,10 +186,7 @@ set(PROJECT_SRC_DIR ${PROJECT_SOURCE_DIR}/src)
 set(LIBRARY_INCLUDE_DIR ${PROJECT_BINARY_DIR}/include CACHE STRING "TsFile includes")
 set(THIRD_PARTY_INCLUDE ${PROJECT_BINARY_DIR}/third_party)
 
-set(SAVED_CXX_FLAGS "${CMAKE_CXX_FLAGS}")
-set(CMAKE_CXX_FLAGS "$ENV{CXXFLAGS} -Wall -std=c++11")
 add_subdirectory(third_party)
-set(CMAKE_CXX_FLAGS "${SAVED_CXX_FLAGS}")
 
 add_subdirectory(src)
 if (BUILD_TEST)
diff --git a/cpp/examples/CMakeLists.txt b/cpp/examples/CMakeLists.txt
index ebe6c66c8..308e285bb 100644
--- a/cpp/examples/CMakeLists.txt
+++ b/cpp/examples/CMakeLists.txt
@@ -21,6 +21,7 @@ project(examples)
 message("Running in exampes directory")
 
 set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++11")
+set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -std=c11")
 
 # TsFile include dir
 set(SDK_INCLUDE_DIR ${PROJECT_SOURCE_DIR}/../src/)
@@ -37,8 +38,13 @@ include_directories(${PROJECT_SOURCE_DIR}/../third_party/antlr4-cpp-runtime-4/ru
 set(BUILD_TYPE "Release")
 include_directories(${SDK_INCLUDE_DIR})
 
-set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -O0 -g")
-set(CMAKE_CXX_FLAGS_DEBUG" ${CMAKE_CXX_FLAGS} -O0 -g")
+if (DEFINED TSFILE_OPTIMIZATION_FLAGS AND NOT "${TSFILE_OPTIMIZATION_FLAGS}" STREQUAL "")
+    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${TSFILE_OPTIMIZATION_FLAGS}")
+    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${TSFILE_OPTIMIZATION_FLAGS}")
+    message("examples using: TSFILE_OPTIMIZATION_FLAGS=${TSFILE_OPTIMIZATION_FLAGS}")
+else ()
+    message("examples using: TSFILE_OPTIMIZATION_FLAGS=<inherit>")
+endif ()
 
 add_subdirectory(cpp_examples)
 add_subdirectory(c_examples)
diff --git a/cpp/examples/README.md b/cpp/examples/README.md
index 5f5af186a..5503eb6f3 100644
--- a/cpp/examples/README.md
+++ b/cpp/examples/README.md
@@ -55,6 +55,14 @@ target_link_libraries(your_target ${TSFILE_LIB})
 
 Note: Set ${SDK_LIB} to your TSFile library directory.
 
+### Optional Optimization Control
+
+By default, `tsfile-cpp` inherits optimization settings from the caller/toolchain.
+If you want to override optimization for `tsfile-cpp`, pass
+`TSFILE_OPTIMIZATION_FLAGS` during configure:
+
+Leave `TSFILE_OPTIMIZATION_FLAGS` empty to keep inherited behavior.
+
 ## 3. Implementation Examples
    
 ### Directory Structure

From 13bb80e91792e5e4c1a517e613cde8939473ba5e Mon Sep 17 00:00:00 2001
From: 761417898 <761417898@qq.com>
Date: Thu, 30 Apr 2026 16:04:13 +0800
Subject: [PATCH 3/5] Align C++ float/double TS_2DIFF default semantics with
 Java.

Use Java-compatible default maxPoint handling for float/double TS_2DIFF encode/decode while preserving legacy raw-block compatibility, and add a byte-level regression test for the documented float/NaN hex sequence.
---
 cpp/src/encoding/ts2diff_decoder.h      | 169 ++++++++++++++++--
 cpp/src/encoding/ts2diff_encoder.h      | 219 ++++++++++++++++++------
 cpp/test/encoding/ts2diff_codec_test.cc |  42 ++++-
 3 files changed, 360 insertions(+), 70 deletions(-)

diff --git a/cpp/src/encoding/ts2diff_decoder.h b/cpp/src/encoding/ts2diff_decoder.h
index 258f04337..416cfa3de 100644
--- a/cpp/src/encoding/ts2diff_decoder.h
+++ b/cpp/src/encoding/ts2diff_decoder.h
@@ -22,7 +22,9 @@
 
 #include <sys/types.h>
 
+#include <cmath>
 #include <cstddef>
+#include <vector>
 
 #include "common/allocator/alloc_base.h"
 #include "common/allocator/byte_stream.h"
@@ -37,30 +39,95 @@ namespace ts2diff_java_detail {
 // then reads BitMaps and Float.intBitsToFloat for float/double TS_2DIFF pages.
 constexpr uint32_t kJavaFloatTs2DiffOverflowMagic =
     2147483646u;  // Integer.MAX_VALUE - 1
+constexpr uint32_t kJavaFloatTs2DiffUnderflowMagic =
+    2147483647u;  // Integer.MAX_VALUE
 
-inline int consume_float_double_ts2diff_prefix(common::ByteStream& in) {
+inline bool bitmap_marked(const std::vector<uint8_t>& bm, int idx) {
+    if (bm.empty()) {
+        return false;
+    }
+    size_t byte_idx = static_cast<size_t>(idx / 8);
+    if (byte_idx >= bm.size()) {
+        return false;
+    }
+    return (bm[byte_idx] & static_cast<uint8_t>(1u << (idx % 8))) != 0;
+}
+
+inline bool looks_like_ts2diff_header(common::ByteStream& in) {
     int ret = common::E_OK;
+    uint32_t probe_mark = in.read_pos();
+    int32_t write_index = 0;
+    int32_t bit_width = 0;
+    if (RET_FAIL(common::SerializationUtil::read_i32(write_index, in)) ||
+        RET_FAIL(common::SerializationUtil::read_i32(bit_width, in))) {
+        in.set_read_pos(probe_mark);
+        return false;
+    }
+    in.set_read_pos(probe_mark);
+    if (write_index < 0 || write_index > 128) {
+        return false;
+    }
+    if (bit_width < 0 || bit_width > 64) {
+        return false;
+    }
+    return true;
+}
+
+inline int consume_float_double_ts2diff_prefix(
+    common::ByteStream& in, bool& is_legacy_raw, int& max_point_number,
+    std::vector<uint8_t>& underflow_bm, std::vector<uint8_t>& value_overflow_bm,
+    int& segment_size) {
+    int ret = common::E_OK;
+    is_legacy_raw = false;
+    max_point_number = 0;
+    underflow_bm.clear();
+    value_overflow_bm.clear();
+    segment_size = 0;
     uint32_t mark = in.read_pos();
     uint32_t tag = 0;
     if (RET_FAIL(common::SerializationUtil::read_var_uint(tag, in))) {
         return ret;
     }
-    if (tag == kJavaFloatTs2DiffOverflowMagic) {
+    if (tag == kJavaFloatTs2DiffOverflowMagic ||
+        tag == kJavaFloatTs2DiffUnderflowMagic) {
         uint32_t n = 0;
         if (RET_FAIL(common::SerializationUtil::read_var_uint(n, in))) {
             return ret;
         }
-        int bm_len = static_cast<int>(n) / 8 + 1;
-        uint32_t skip_to = in.read_pos() + static_cast<uint32_t>(bm_len * 2);
-        in.set_read_pos(skip_to);
-        uint32_t inner_max_point = 0;
-        if (RET_FAIL(common::SerializationUtil::read_var_uint(inner_max_point,
-                                                              in))) {
+        segment_size = static_cast<int>(n);
+        int bm_len = segment_size / 8 + 1;
+        underflow_bm.resize(static_cast<size_t>(bm_len), 0);
+        uint32_t read_len = 0;
+        if (RET_FAIL(in.read_buf(underflow_bm.data(),
+                                 static_cast<uint32_t>(bm_len), read_len)) ||
+            read_len != static_cast<uint32_t>(bm_len)) {
             return ret;
         }
-        (void)inner_max_point;
-    } else {
+        if (tag == kJavaFloatTs2DiffOverflowMagic) {
+            value_overflow_bm.resize(static_cast<size_t>(bm_len), 0);
+            if (RET_FAIL(in.read_buf(value_overflow_bm.data(),
+                                     static_cast<uint32_t>(bm_len),
+                                     read_len)) ||
+                read_len != static_cast<uint32_t>(bm_len)) {
+                return ret;
+            }
+        }
+        uint32_t mpn = 0;
+        if (RET_FAIL(common::SerializationUtil::read_var_uint(mpn, in))) {
+            return ret;
+        }
+        max_point_number = static_cast<int>(mpn);
+        return common::E_OK;
+    }
+
+    // Possible non-overflow Java-style prefix (maxPointNumber) OR legacy raw
+    // C++ TS_2DIFF block (no prefix). Probe header to distinguish.
+    max_point_number = static_cast<int>(tag);
+    if (!looks_like_ts2diff_header(in)) {
         in.set_read_pos(mark);
+        is_legacy_raw = true;
+    } else {
+        segment_size = 0;  // unknown; determined by TS2DIFF block header
     }
     return common::E_OK;
 }
@@ -211,6 +278,7 @@ inline int64_t TS2DIFFDecoder<int64_t>::decode(common::ByteStream& in) {
 
 class FloatTS2DIFFDecoder : public TS2DIFFDecoder<int32_t> {
    public:
+    FloatTS2DIFFDecoder() = default;
     float decode(common::ByteStream& in) {
         int32_t value_int = TS2DIFFDecoder<int32_t>::decode(in);
         return common::int_to_float(value_int);
@@ -221,10 +289,20 @@ class FloatTS2DIFFDecoder : public TS2DIFFDecoder<int32_t> {
     int read_int64(int64_t& ret_value, common::ByteStream& in);
     int read_float(float& ret_value, common::ByteStream& in);
     int read_double(double& ret_value, common::ByteStream& in);
+
+   private:
+    bool is_legacy_raw_{false};
+    int max_point_number_{0};
+    double max_point_value_{1.0};
+    int segment_pos_{0};
+    int segment_size_{0};
+    std::vector<uint8_t> underflow_bm_;
+    std::vector<uint8_t> value_overflow_bm_;
 };
 
 class DoubleTS2DIFFDecoder : public TS2DIFFDecoder<int64_t> {
    public:
+    DoubleTS2DIFFDecoder() = default;
     double decode(common::ByteStream& in) {
         int64_t value_long = TS2DIFFDecoder<int64_t>::decode(in);
         return common::long_to_double(value_long);
@@ -235,6 +313,15 @@ class DoubleTS2DIFFDecoder : public TS2DIFFDecoder<int64_t> {
     int read_int64(int64_t& ret_value, common::ByteStream& in);
     int read_float(float& ret_value, common::ByteStream& in);
     int read_double(double& ret_value, common::ByteStream& in);
+
+   private:
+    bool is_legacy_raw_{false};
+    int max_point_number_{0};
+    double max_point_value_{1.0};
+    int segment_pos_{0};
+    int segment_size_{0};
+    std::vector<uint8_t> underflow_bm_;
+    std::vector<uint8_t> value_overflow_bm_;
 };
 
 typedef TS2DIFFDecoder<int32_t> IntTS2DIFFDecoder;
@@ -333,16 +420,37 @@ FORCE_INLINE int FloatTS2DIFFDecoder::read_int64(int64_t& ret_value,
 FORCE_INLINE int FloatTS2DIFFDecoder::read_float(float& ret_value,
                                                  common::ByteStream& in) {
     int ret = common::E_OK;
-    // Each encoder flush() emits a self-contained Java-compatible segment.
-    // TS_2DIFFDecoder resets current_index_ to 0 at block boundaries; align
-    // the outer FloatEncoder wrapper before reading each new inner block.
     if (current_index_ == 0) {
-        if (RET_FAIL(
-                ts2diff_java_detail::consume_float_double_ts2diff_prefix(in))) {
+        if (RET_FAIL(ts2diff_java_detail::consume_float_double_ts2diff_prefix(
+                in, is_legacy_raw_, max_point_number_, underflow_bm_,
+                value_overflow_bm_, segment_size_))) {
             return ret;
         }
+        max_point_value_ =
+            max_point_number_ <= 0
+                ? 1.0
+                : std::pow(10.0, static_cast<double>(max_point_number_));
+        segment_pos_ = 0;
     }
-    ret_value = decode(in);
+    if (is_legacy_raw_) {
+        ret_value = decode(in);
+        return common::E_OK;
+    }
+    int32_t value_int = TS2DIFFDecoder<int32_t>::decode(in);
+    if (!value_overflow_bm_.empty() &&
+        ts2diff_java_detail::bitmap_marked(value_overflow_bm_, segment_pos_)) {
+        ret_value = common::int_to_float(value_int);
+    } else {
+        bool use_scaled = true;
+        if (!underflow_bm_.empty()) {
+            use_scaled =
+                ts2diff_java_detail::bitmap_marked(underflow_bm_, segment_pos_);
+        }
+        const double divisor = use_scaled ? max_point_value_ : 1.0;
+        ret_value =
+            static_cast<float>(static_cast<double>(value_int) / divisor);
+    }
+    segment_pos_++;
     return common::E_OK;
 }
 FORCE_INLINE int FloatTS2DIFFDecoder::read_double(double& ret_value,
@@ -374,12 +482,35 @@ FORCE_INLINE int DoubleTS2DIFFDecoder::read_double(double& ret_value,
                                                    common::ByteStream& in) {
     int ret = common::E_OK;
     if (current_index_ == 0) {
-        if (RET_FAIL(
-                ts2diff_java_detail::consume_float_double_ts2diff_prefix(in))) {
+        if (RET_FAIL(ts2diff_java_detail::consume_float_double_ts2diff_prefix(
+                in, is_legacy_raw_, max_point_number_, underflow_bm_,
+                value_overflow_bm_, segment_size_))) {
             return ret;
         }
+        max_point_value_ =
+            max_point_number_ <= 0
+                ? 1.0
+                : std::pow(10.0, static_cast<double>(max_point_number_));
+        segment_pos_ = 0;
     }
-    ret_value = decode(in);
+    if (is_legacy_raw_) {
+        ret_value = decode(in);
+        return common::E_OK;
+    }
+    int64_t value_long = TS2DIFFDecoder<int64_t>::decode(in);
+    if (!value_overflow_bm_.empty() &&
+        ts2diff_java_detail::bitmap_marked(value_overflow_bm_, segment_pos_)) {
+        ret_value = common::long_to_double(value_long);
+    } else {
+        bool use_scaled = true;
+        if (!underflow_bm_.empty()) {
+            use_scaled =
+                ts2diff_java_detail::bitmap_marked(underflow_bm_, segment_pos_);
+        }
+        const double divisor = use_scaled ? max_point_value_ : 1.0;
+        ret_value = static_cast<double>(value_long) / divisor;
+    }
+    segment_pos_++;
     return common::E_OK;
 }
 
diff --git a/cpp/src/encoding/ts2diff_encoder.h b/cpp/src/encoding/ts2diff_encoder.h
index bd51d2cc9..a94b6b57e 100644
--- a/cpp/src/encoding/ts2diff_encoder.h
+++ b/cpp/src/encoding/ts2diff_encoder.h
@@ -22,6 +22,8 @@
 
 #include <sys/types.h>
 
+#include <cmath>
+#include <limits>
 #include <vector>
 
 #include "common/allocator/alloc_base.h"
@@ -273,8 +275,9 @@ inline int TS2DIFFEncoder<int64_t>::flush(common::ByteStream& out_stream) {
 
 class FloatTS2DIFFEncoder : public TS2DIFFEncoder<int32_t> {
    public:
+    FloatTS2DIFFEncoder() : max_point_number_(2), max_point_value_(100.0) {}
     int do_encode(float value, common::ByteStream& out_stream) {
-        int32_t value_int = common::float_to_int(value);
+        int32_t value_int = convert_float_to_int(value);
         return TS2DIFFEncoder<int32_t>::do_encode(value_int, out_stream);
     }
     int flush(common::ByteStream& out_stream) override;
@@ -283,12 +286,52 @@ class FloatTS2DIFFEncoder : public TS2DIFFEncoder<int32_t> {
     int encode(int64_t value, common::ByteStream& out_stream);
     int encode(float value, common::ByteStream& out_stream);
     int encode(double value, common::ByteStream& out_stream);
+
+   private:
+    int32_t convert_float_to_int(float value) {
+        const double scaled = static_cast<double>(value) * max_point_value_;
+        if (scaled > static_cast<double>(std::numeric_limits<int32_t>::max()) ||
+            scaled < static_cast<double>(std::numeric_limits<int32_t>::min())) {
+            if (std::isnan(value) ||
+                value >
+                    static_cast<float>(std::numeric_limits<int32_t>::max()) ||
+                value <
+                    static_cast<float>(std::numeric_limits<int32_t>::min())) {
+                underflow_flags_.push_back(-1);  // value itself overflow
+                return common::float_to_int(value);
+            }
+            underflow_flags_.push_back(
+                0);  // scaled overflow, keep rounded value
+            return static_cast<int32_t>(std::lround(value));
+        }
+        if (std::isnan(value)) {
+            underflow_flags_.push_back(-1);
+            return common::float_to_int(value);
+        }
+        underflow_flags_.push_back(
+            1);  // scaled and will divide by max_point_value_
+        return static_cast<int32_t>(std::lround(scaled));
+    }
+    bool has_overflow() const {
+        for (int8_t f : underflow_flags_) {
+            if (f != 1) {
+                return true;
+            }
+        }
+        return false;
+    }
+
+   private:
+    int max_point_number_;
+    double max_point_value_;
+    std::vector<int8_t> underflow_flags_;
 };
 
 class DoubleTS2DIFFEncoder : public TS2DIFFEncoder<int64_t> {
    public:
+    DoubleTS2DIFFEncoder() : max_point_number_(2), max_point_value_(100.0) {}
     int do_encode(double value, common::ByteStream& out_stream) {
-        int64_t value_long = common::double_to_long(value);
+        int64_t value_long = convert_double_to_long(value);
         return TS2DIFFEncoder<int64_t>::do_encode(value_long, out_stream);
     }
     int flush(common::ByteStream& out_stream) override;
@@ -297,6 +340,45 @@ class DoubleTS2DIFFEncoder : public TS2DIFFEncoder<int64_t> {
     int encode(int64_t value, common::ByteStream& out_stream);
     int encode(float value, common::ByteStream& out_stream);
     int encode(double value, common::ByteStream& out_stream);
+
+   private:
+    int64_t convert_double_to_long(double value) {
+        const double scaled = value * max_point_value_;
+        if (scaled > static_cast<double>(std::numeric_limits<int64_t>::max()) ||
+            scaled < static_cast<double>(std::numeric_limits<int64_t>::min())) {
+            if (std::isnan(value) ||
+                value >
+                    static_cast<double>(std::numeric_limits<int64_t>::max()) ||
+                value <
+                    static_cast<double>(std::numeric_limits<int64_t>::min())) {
+                underflow_flags_.push_back(-1);  // value itself overflow
+                return common::double_to_long(value);
+            }
+            underflow_flags_.push_back(
+                0);  // scaled overflow, keep rounded value
+            return static_cast<int64_t>(std::llround(value));
+        }
+        if (std::isnan(value)) {
+            underflow_flags_.push_back(-1);
+            return common::double_to_long(value);
+        }
+        underflow_flags_.push_back(
+            1);  // scaled and will divide by max_point_value_
+        return static_cast<int64_t>(std::llround(scaled));
+    }
+    bool has_overflow() const {
+        for (int8_t f : underflow_flags_) {
+            if (f != 1) {
+                return true;
+            }
+        }
+        return false;
+    }
+
+   private:
+    int max_point_number_;
+    double max_point_value_;
+    std::vector<int8_t> underflow_flags_;
 };
 
 typedef TS2DIFFEncoder<int32_t> IntTS2DIFFEncoder;
@@ -416,7 +498,8 @@ FORCE_INLINE int FloatTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
     }
     const int num_values = write_index_ + 1;
     common::ByteStream inner(1024, common::MOD_TS2DIFF_OBJ, false);
-    if (RET_FAIL(common::SerializationUtil::write_var_uint(0u, inner))) {
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(
+            static_cast<uint32_t>(max_point_number_), inner))) {
         return ret;
     }
     SIMDOps<int32_t>::rebase(delta_arr_, delta_arr_min_, write_index_);
@@ -443,33 +526,51 @@ FORCE_INLINE int FloatTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
     flush_remaining(inner);
     reset();
 
-    constexpr uint32_t kJavaFloatTs2DiffOverflowMagic =
-        2147483646u;  // Java Integer.MAX_VALUE - 1
-    if (RET_FAIL(common::SerializationUtil::write_var_uint(
-            kJavaFloatTs2DiffOverflowMagic, out_stream))) {
-        return ret;
-    }
-    if (RET_FAIL(common::SerializationUtil::write_var_uint(
-            static_cast<uint32_t>(num_values), out_stream))) {
-        return ret;
-    }
-    int bm_len = num_values / 8 + 1;
-    std::vector<uint8_t> under(static_cast<size_t>(bm_len), 0);
-    std::vector<uint8_t> over(static_cast<size_t>(bm_len), 0);
-    for (int i = 0; i < num_values; i++) {
-        over[static_cast<size_t>(i / 8)] |= static_cast<uint8_t>(1u << (i % 8));
-    }
-    if (RET_FAIL(out_stream.write_buf(under.data(),
-                                      static_cast<uint32_t>(bm_len)))) {
-        return ret;
-    }
-    if (RET_FAIL(
-            out_stream.write_buf(over.data(), static_cast<uint32_t>(bm_len)))) {
-        return ret;
+    const bool overflow = has_overflow();
+    if (overflow) {
+        std::vector<uint8_t> underflow_bitmap(
+            static_cast<size_t>(num_values / 8 + 1), 0);
+        std::vector<uint8_t> value_overflow_bitmap(
+            static_cast<size_t>(num_values / 8 + 1), 0);
+        bool has_value_overflow = false;
+        for (int i = 0; i < num_values; i++) {
+            int8_t f = underflow_flags_[static_cast<size_t>(i)];
+            if (f == 1) {
+                underflow_bitmap[static_cast<size_t>(i / 8)] |=
+                    static_cast<uint8_t>(1u << (i % 8));
+            } else if (f == -1) {
+                has_value_overflow = true;
+                value_overflow_bitmap[static_cast<size_t>(i / 8)] |=
+                    static_cast<uint8_t>(1u << (i % 8));
+            }
+        }
+        constexpr uint32_t kJavaOverflowMagic =
+            2147483647u;  // Integer.MAX_VALUE
+        constexpr uint32_t kJavaValueOverflowMagic =
+            2147483646u;  // Integer.MAX_VALUE - 1
+        if (RET_FAIL(common::SerializationUtil::write_var_uint(
+                has_value_overflow ? kJavaValueOverflowMagic
+                                   : kJavaOverflowMagic,
+                out_stream))) {
+            return ret;
+        }
+        if (RET_FAIL(common::SerializationUtil::write_var_uint(
+                static_cast<uint32_t>(num_values), out_stream))) {
+            return ret;
+        }
+        const uint32_t bm_len = static_cast<uint32_t>(num_values / 8 + 1);
+        if (RET_FAIL(out_stream.write_buf(underflow_bitmap.data(), bm_len))) {
+            return ret;
+        }
+        if (has_value_overflow && RET_FAIL(out_stream.write_buf(
+                                      value_overflow_bitmap.data(), bm_len))) {
+            return ret;
+        }
     }
     if (RET_FAIL(merge_byte_stream(out_stream, inner, true))) {
         return ret;
     }
+    underflow_flags_.clear();
     return ret;
 }
 
@@ -480,7 +581,8 @@ FORCE_INLINE int DoubleTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
     }
     const int num_values = write_index_ + 1;
     common::ByteStream inner(1024, common::MOD_TS2DIFF_OBJ, false);
-    if (RET_FAIL(common::SerializationUtil::write_var_uint(0u, inner))) {
+    if (RET_FAIL(common::SerializationUtil::write_var_uint(
+            static_cast<uint32_t>(max_point_number_), inner))) {
         return ret;
     }
     SIMDOps<int64_t>::rebase(delta_arr_, delta_arr_min_, write_index_);
@@ -503,32 +605,51 @@ FORCE_INLINE int DoubleTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
     flush_remaining(inner);
     reset();
 
-    constexpr uint32_t kJavaFloatTs2DiffOverflowMagic = 2147483646u;
-    if (RET_FAIL(common::SerializationUtil::write_var_uint(
-            kJavaFloatTs2DiffOverflowMagic, out_stream))) {
-        return ret;
-    }
-    if (RET_FAIL(common::SerializationUtil::write_var_uint(
-            static_cast<uint32_t>(num_values), out_stream))) {
-        return ret;
-    }
-    int bm_len = num_values / 8 + 1;
-    std::vector<uint8_t> under(static_cast<size_t>(bm_len), 0);
-    std::vector<uint8_t> over(static_cast<size_t>(bm_len), 0);
-    for (int i = 0; i < num_values; i++) {
-        over[static_cast<size_t>(i / 8)] |= static_cast<uint8_t>(1u << (i % 8));
-    }
-    if (RET_FAIL(out_stream.write_buf(under.data(),
-                                      static_cast<uint32_t>(bm_len)))) {
-        return ret;
-    }
-    if (RET_FAIL(
-            out_stream.write_buf(over.data(), static_cast<uint32_t>(bm_len)))) {
-        return ret;
+    const bool overflow = has_overflow();
+    if (overflow) {
+        std::vector<uint8_t> underflow_bitmap(
+            static_cast<size_t>(num_values / 8 + 1), 0);
+        std::vector<uint8_t> value_overflow_bitmap(
+            static_cast<size_t>(num_values / 8 + 1), 0);
+        bool has_value_overflow = false;
+        for (int i = 0; i < num_values; i++) {
+            int8_t f = underflow_flags_[static_cast<size_t>(i)];
+            if (f == 1) {
+                underflow_bitmap[static_cast<size_t>(i / 8)] |=
+                    static_cast<uint8_t>(1u << (i % 8));
+            } else if (f == -1) {
+                has_value_overflow = true;
+                value_overflow_bitmap[static_cast<size_t>(i / 8)] |=
+                    static_cast<uint8_t>(1u << (i % 8));
+            }
+        }
+        constexpr uint32_t kJavaOverflowMagic =
+            2147483647u;  // Integer.MAX_VALUE
+        constexpr uint32_t kJavaValueOverflowMagic =
+            2147483646u;  // Integer.MAX_VALUE - 1
+        if (RET_FAIL(common::SerializationUtil::write_var_uint(
+                has_value_overflow ? kJavaValueOverflowMagic
+                                   : kJavaOverflowMagic,
+                out_stream))) {
+            return ret;
+        }
+        if (RET_FAIL(common::SerializationUtil::write_var_uint(
+                static_cast<uint32_t>(num_values), out_stream))) {
+            return ret;
+        }
+        const uint32_t bm_len = static_cast<uint32_t>(num_values / 8 + 1);
+        if (RET_FAIL(out_stream.write_buf(underflow_bitmap.data(), bm_len))) {
+            return ret;
+        }
+        if (has_value_overflow && RET_FAIL(out_stream.write_buf(
+                                      value_overflow_bitmap.data(), bm_len))) {
+            return ret;
+        }
     }
     if (RET_FAIL(merge_byte_stream(out_stream, inner, true))) {
         return ret;
     }
+    underflow_flags_.clear();
     return ret;
 }
 
diff --git a/cpp/test/encoding/ts2diff_codec_test.cc b/cpp/test/encoding/ts2diff_codec_test.cc
index bfa58b4e3..317773d92 100644
--- a/cpp/test/encoding/ts2diff_codec_test.cc
+++ b/cpp/test/encoding/ts2diff_codec_test.cc
@@ -20,8 +20,11 @@
 
 #include <bitset>
 #include <chrono>
+#include <cmath>
 #include <cstring>
+#include <iomanip>
 #include <random>
+#include <sstream>
 #include <vector>
 
 #include "encoding/ts2diff_decoder.h"
@@ -96,12 +99,32 @@ class FloatDoubleTS2DIFFCodecTest : public ::testing::Test {
     DoubleTS2DIFFDecoder* decoder_double_{nullptr};
 };
 
+static std::string byte_stream_to_hex(common::ByteStream& stream) {
+    uint32_t mark = stream.read_pos();
+    uint32_t size = stream.total_size();
+    std::vector<uint8_t> buf(size);
+    uint32_t read_len = 0;
+    EXPECT_EQ(stream.read_buf(buf.data(), size, read_len), common::E_OK);
+    EXPECT_EQ(read_len, size);
+    stream.set_read_pos(mark);
+
+    std::ostringstream oss;
+    for (uint32_t i = 0; i < size; i++) {
+        if (i > 0) {
+            oss << " ";
+        }
+        oss << std::uppercase << std::hex << std::setw(2) << std::setfill('0')
+            << static_cast<unsigned>(buf[i]);
+    }
+    return oss.str();
+}
+
 TEST_F(FloatDoubleTS2DIFFCodecTest, TestFloatRoundTrip) {
     common::ByteStream out_stream(1024, common::MOD_TS2DIFF_OBJ, false);
     const int row_num = 1000;
     std::vector<float> data(row_num);
     for (int i = 0; i < row_num; i++) {
-        data[i] = static_cast<float>(i) * 0.125f + 0.25f;
+        data[i] = static_cast<float>(i) * 0.25f + 0.50f;
     }
     for (int i = 0; i < row_num; i++) {
         EXPECT_EQ(encoder_float_->encode(data[i], out_stream), common::E_OK);
@@ -116,12 +139,27 @@ TEST_F(FloatDoubleTS2DIFFCodecTest, TestFloatRoundTrip) {
     EXPECT_FALSE(decoder_float_->has_remaining(out_stream));
 }
 
+TEST_F(FloatDoubleTS2DIFFCodecTest, TestFloatJavaDefaultHexCompatibility) {
+    common::ByteStream out_stream(1024, common::MOD_TS2DIFF_OBJ, false);
+    const float data[] = {3.123456768E20f, std::nanf("")};
+
+    for (float v : data) {
+        EXPECT_EQ(encoder_float_->encode(v, out_stream), common::E_OK);
+    }
+    EXPECT_EQ(encoder_float_->flush(out_stream), common::E_OK);
+
+    const std::string expected_hex =
+        "FE FF FF FF 07 02 00 03 02 00 00 00 01 00 00 00 00 1E 38 8A AA 61 87 "
+        "75 56";
+    EXPECT_EQ(byte_stream_to_hex(out_stream), expected_hex);
+}
+
 TEST_F(FloatDoubleTS2DIFFCodecTest, TestDoubleRoundTrip) {
     common::ByteStream out_stream(1024, common::MOD_TS2DIFF_OBJ, false);
     const int row_num = 800;
     std::vector<double> data(row_num);
     for (int i = 0; i < row_num; i++) {
-        data[i] = static_cast<double>(i) * 0.0625 + 0.5;
+        data[i] = static_cast<double>(i) * 0.25 + 0.5;
     }
     for (int i = 0; i < row_num; i++) {
         EXPECT_EQ(encoder_double_->encode(data[i], out_stream), common::E_OK);

From fa396502e2dc8d2c51c70ebe825dd39eba3b69d3 Mon Sep 17 00:00:00 2001
From: 761417898 <761417898@qq.com>
Date: Thu, 30 Apr 2026 17:39:22 +0800
Subject: [PATCH 4/5] Fix table time decoder selection for chunk readers.

Use the actual time chunk encoding instead of global default when building time decoders in table read paths, preventing wrong TS_2DIFF decoding on PLAIN time chunks.
---
 .../org/apache/tsfile/read/TsFileSequenceReader.java | 12 ++++++++----
 .../reader/chunk/AbstractAlignedChunkReader.java     |  2 +-
 .../read/reader/chunk/AbstractChunkReader.java       |  4 ++++
 .../apache/tsfile/read/reader/chunk/ChunkReader.java |  2 +-
 4 files changed, 14 insertions(+), 6 deletions(-)

diff --git a/java/tsfile/src/main/java/org/apache/tsfile/read/TsFileSequenceReader.java b/java/tsfile/src/main/java/org/apache/tsfile/read/TsFileSequenceReader.java
index 481a4d6c2..69aded79d 100644
--- a/java/tsfile/src/main/java/org/apache/tsfile/read/TsFileSequenceReader.java
+++ b/java/tsfile/src/main/java/org/apache/tsfile/read/TsFileSequenceReader.java
@@ -2433,11 +2433,15 @@ public long selfCheck(
                     Decoder.getDecoderByType(
                         chunkHeader.getEncodingType(), chunkHeader.getDataType());
                 ByteBuffer pageData = readPage(pageHeader, chunkHeader.getCompressionType());
+                TSEncoding configuredTimeEncoding =
+                    TSEncoding.valueOf(TSFileDescriptor.getInstance().getConfig().getTimeEncoder());
+                boolean isTimeColumn =
+                    (chunkHeader.getChunkType() & TsFileConstant.TIME_COLUMN_MASK)
+                        == TsFileConstant.TIME_COLUMN_MASK;
+                TSEncoding selectedTimeEncoding =
+                    isTimeColumn ? chunkHeader.getEncodingType() : configuredTimeEncoding;
                 Decoder timeDecoder =
-                    Decoder.getDecoderByType(
-                        TSEncoding.valueOf(
-                            TSFileDescriptor.getInstance().getConfig().getTimeEncoder()),
-                        TSDataType.INT64);
+                    Decoder.getDecoderByType(selectedTimeEncoding, TSDataType.INT64);
 
                 if ((chunkHeader.getChunkType() & TsFileConstant.TIME_COLUMN_MASK)
                     == TsFileConstant.TIME_COLUMN_MASK) { // Time Chunk with only one page
diff --git a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractAlignedChunkReader.java b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractAlignedChunkReader.java
index 85073a456..acc9789e4 100644
--- a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractAlignedChunkReader.java
+++ b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractAlignedChunkReader.java
@@ -250,7 +250,7 @@ private AbstractAlignedPageReader constructAlignedPageReader(
     return constructPageReader(
         timePageHeader,
         timePageData,
-        defaultTimeDecoder,
+        getTimeDecoder(timeChunkHeader.getEncodingType()),
         valuePageHeaderList,
         lazyLoadPageDataArray,
         valueDataTypeList,
diff --git a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java
index caaa58751..5defe047d 100644
--- a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java
+++ b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java
@@ -40,6 +40,10 @@ public abstract class AbstractChunkReader implements IChunkReader {
           TSEncoding.valueOf(TSFileDescriptor.getInstance().getConfig().getTimeEncoder()),
           TSDataType.INT64);
 
+  protected Decoder getTimeDecoder(TSEncoding actualTimeEncoding) {
+    return Decoder.getDecoderByType(actualTimeEncoding, TSDataType.INT64);
+  }
+
   protected final long readStopTime;
 
   // any filter, no matter value filter or time filter
diff --git a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/ChunkReader.java b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/ChunkReader.java
index c2b2301d7..9d917fa8d 100644
--- a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/ChunkReader.java
+++ b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/ChunkReader.java
@@ -153,7 +153,7 @@ private PageReader constructPageReader(PageHeader pageHeader) {
                 chunkDataBuffer.array(), currentPagePosition, unCompressor, encryptParam),
             chunkHeader.getDataType(),
             chunkHeader.calculateDecoderForNonTimeChunk(),
-            defaultTimeDecoder,
+            getTimeDecoder(chunkHeader.getEncodingType()),
             queryFilter);
     reader.setDeleteIntervalList(deleteIntervalList);
     return reader;

From 24f43678b2805c2815f58813b58d05cacfccb80b Mon Sep 17 00:00:00 2001
From: 761417898 <761417898@qq.com>
Date: Thu, 30 Apr 2026 17:52:15 +0800
Subject: [PATCH 5/5] Trim redundant comments and remove dead time decoder
 field.

Drop nonessential explanatory comments in TS_2DIFF codec changes and remove unused defaultTimeDecoder from AbstractChunkReader to keep the PR focused for review.
---
 cpp/src/encoding/ts2diff_decoder.h            |  8 +++-----
 cpp/src/encoding/ts2diff_encoder.h            | 20 +++++++------------
 cpp/test/encoding/ts2diff_codec_test.cc       |  2 --
 .../reader/chunk/AbstractChunkReader.java     |  6 ------
 4 files changed, 10 insertions(+), 26 deletions(-)

diff --git a/cpp/src/encoding/ts2diff_decoder.h b/cpp/src/encoding/ts2diff_decoder.h
index 416cfa3de..fcaff771c 100644
--- a/cpp/src/encoding/ts2diff_decoder.h
+++ b/cpp/src/encoding/ts2diff_decoder.h
@@ -35,8 +35,7 @@ namespace storage {
 
 namespace ts2diff_java_detail {
 
-// Java FloatEncoder overflow flush uses Integer.MAX_VALUE - 1; FloatDecoder
-// then reads BitMaps and Float.intBitsToFloat for float/double TS_2DIFF pages.
+// Java float/double TS_2DIFF overflow page markers.
 constexpr uint32_t kJavaFloatTs2DiffOverflowMagic =
     2147483646u;  // Integer.MAX_VALUE - 1
 constexpr uint32_t kJavaFloatTs2DiffUnderflowMagic =
@@ -120,14 +119,13 @@ inline int consume_float_double_ts2diff_prefix(
         return common::E_OK;
     }
 
-    // Possible non-overflow Java-style prefix (maxPointNumber) OR legacy raw
-    // C++ TS_2DIFF block (no prefix). Probe header to distinguish.
+    // Distinguish Java maxPointNumber prefix from legacy raw C++ block.
     max_point_number = static_cast<int>(tag);
     if (!looks_like_ts2diff_header(in)) {
         in.set_read_pos(mark);
         is_legacy_raw = true;
     } else {
-        segment_size = 0;  // unknown; determined by TS2DIFF block header
+        segment_size = 0;
     }
     return common::E_OK;
 }
diff --git a/cpp/src/encoding/ts2diff_encoder.h b/cpp/src/encoding/ts2diff_encoder.h
index a94b6b57e..4e5d0ba4e 100644
--- a/cpp/src/encoding/ts2diff_encoder.h
+++ b/cpp/src/encoding/ts2diff_encoder.h
@@ -297,19 +297,17 @@ class FloatTS2DIFFEncoder : public TS2DIFFEncoder<int32_t> {
                     static_cast<float>(std::numeric_limits<int32_t>::max()) ||
                 value <
                     static_cast<float>(std::numeric_limits<int32_t>::min())) {
-                underflow_flags_.push_back(-1);  // value itself overflow
+                underflow_flags_.push_back(-1);
                 return common::float_to_int(value);
             }
-            underflow_flags_.push_back(
-                0);  // scaled overflow, keep rounded value
+            underflow_flags_.push_back(0);
             return static_cast<int32_t>(std::lround(value));
         }
         if (std::isnan(value)) {
             underflow_flags_.push_back(-1);
             return common::float_to_int(value);
         }
-        underflow_flags_.push_back(
-            1);  // scaled and will divide by max_point_value_
+        underflow_flags_.push_back(1);
         return static_cast<int32_t>(std::lround(scaled));
     }
     bool has_overflow() const {
@@ -351,19 +349,17 @@ class DoubleTS2DIFFEncoder : public TS2DIFFEncoder<int64_t> {
                     static_cast<double>(std::numeric_limits<int64_t>::max()) ||
                 value <
                     static_cast<double>(std::numeric_limits<int64_t>::min())) {
-                underflow_flags_.push_back(-1);  // value itself overflow
+                underflow_flags_.push_back(-1);
                 return common::double_to_long(value);
             }
-            underflow_flags_.push_back(
-                0);  // scaled overflow, keep rounded value
+            underflow_flags_.push_back(0);
             return static_cast<int64_t>(std::llround(value));
         }
         if (std::isnan(value)) {
             underflow_flags_.push_back(-1);
             return common::double_to_long(value);
         }
-        underflow_flags_.push_back(
-            1);  // scaled and will divide by max_point_value_
+        underflow_flags_.push_back(1);
         return static_cast<int64_t>(std::llround(scaled));
     }
     bool has_overflow() const {
@@ -488,9 +484,7 @@ FORCE_INLINE int DoubleTS2DIFFEncoder::encode(double value,
     return do_encode(value, out);
 }
 
-// Align with Java FloatEncoder TS_2DIFF page layout (overflow flush): outer
-// header + BitMaps so FloatDecoder uses Float.intBitsToFloat on every value
-// (C++ stores IEEE float bits, not scaled decimals).
+// Keep float/double TS_2DIFF page layout compatible with Java.
 FORCE_INLINE int FloatTS2DIFFEncoder::flush(common::ByteStream& out_stream) {
     int ret = common::E_OK;
     if (write_index_ == -1) {
diff --git a/cpp/test/encoding/ts2diff_codec_test.cc b/cpp/test/encoding/ts2diff_codec_test.cc
index 317773d92..755338b30 100644
--- a/cpp/test/encoding/ts2diff_codec_test.cc
+++ b/cpp/test/encoding/ts2diff_codec_test.cc
@@ -65,8 +65,6 @@ class TS2DIFFCodecTest : public ::testing::Test {
     LongTS2DIFFDecoder* decoder_long_;
 };
 
-// Float/double TS_2DIFF: page layout must match Java FloatEncoder (overflow
-// flush) so cross-language readers see Float.intBitsToFloat values.
 class FloatDoubleTS2DIFFCodecTest : public ::testing::Test {
    protected:
     void SetUp() override {
diff --git a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java
index 5defe047d..aa675ba38 100644
--- a/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java
+++ b/java/tsfile/src/main/java/org/apache/tsfile/read/reader/chunk/AbstractChunkReader.java
@@ -19,7 +19,6 @@
 
 package org.apache.tsfile.read.reader.chunk;
 
-import org.apache.tsfile.common.conf.TSFileDescriptor;
 import org.apache.tsfile.encoding.decoder.Decoder;
 import org.apache.tsfile.enums.TSDataType;
 import org.apache.tsfile.file.metadata.enums.TSEncoding;
@@ -35,11 +34,6 @@
 
 public abstract class AbstractChunkReader implements IChunkReader {
 
-  protected final Decoder defaultTimeDecoder =
-      Decoder.getDecoderByType(
-          TSEncoding.valueOf(TSFileDescriptor.getInstance().getConfig().getTimeEncoder()),
-          TSDataType.INT64);
-
   protected Decoder getTimeDecoder(TSEncoding actualTimeEncoding) {
     return Decoder.getDecoderByType(actualTimeEncoding, TSDataType.INT64);
   }